fix(stage-ui,stage-web): emit literals asap and show streaming messages (#451)

sumimakito · web-flow · commit 36d74ca37b10 · 2025-08-26T20:32:04.000+09:00
diff --git a/apps/stage-web/src/components/Widgets/ChatHistory.vue b/apps/stage-web/src/components/Widgets/ChatHistory.vue
@@ -8,7 +8,7 @@ import { useI18n } from 'vue-i18n'
 const chatHistoryRef = ref<HTMLDivElement>()
 
 const { t } = useI18n()
-const { messages, sending } = storeToRefs(useChatStore())
+const { messages, sending, streamingMessage } = storeToRefs(useChatStore())
 
 const { onBeforeMessageComposed, onTokenLiteral } = useChatStore()
 
@@ -104,6 +104,33 @@ onTokenLiteral(async () => {
           </div>
         </div>
       </div>
+      <div v-if="sending" flex mr="12">
+        <div
+          flex="~ col" border="2 solid primary-200/50 dark:primary-500/50" shadow="md primary-200/50 dark:none" min-w-20
+          rounded-lg px-2 py-1 h="unset <sm:fit" bg="<md:primary-500/25"
+        >
+          <div>
+            <span text-xs text="primary-400/90 dark:primary-600/90" font-normal class="inline <sm:hidden">{{ t('stage.chat.message.character-name.airi') }}</span>
+          </div>
+          <div v-if="streamingMessage.content" class="break-words" text="xs primary-400">
+            <div v-for="(slice, sliceIndex) in streamingMessage.slices" :key="sliceIndex">
+              <div v-if="slice.type === 'tool-call'">
+                <div
+                  p="1" border="1 solid primary-200" rounded-lg m="y-1" bg="primary-100"
+                >
+                  Called: <code>{{ slice.toolCall.toolName }}</code>
+                </div>
+              </div>
+              <div v-else-if="slice.type === 'tool-call-result'" /> <!-- this line should be unreachable -->
+              <MarkdownRenderer
+                v-else
+                :content="slice.text"
+              />
+            </div>
+          </div>
+          <div v-else i-eos-icons:three-dots-loading />
+        </div>
+      </div>
     </div>
   </div>
 </template>
diff --git a/packages/stage-ui/src/composables/llmmarkerParser.ts b/packages/stage-ui/src/composables/llmmarkerParser.ts
@@ -1,3 +1,6 @@
+const TAG_OPEN = '<|'
+const TAG_CLOSE = '|>'
+
 /**
  * A streaming parser for LLM responses that contain special markers (e.g., for tool calls).
  * This composable is designed to be efficient and robust, using a regular expression
@@ -15,9 +18,15 @@
 export function useLlmmarkerParser(options: {
   onLiteral?: (literal: string) => void | Promise<void>
   onSpecial?: (special: string) => void | Promise<void>
+  /**
+   * The minimum length of text required to emit a literal part.
+   * Useful for avoiding emitting literal parts too fast.
+   */
+  minLiteralEmitLength?: number
 }) {
+  const minLiteralEmitLength = Math.max(1, options.minLiteralEmitLength ?? 1)
   let buffer = ''
-  const tagRegex = /(<\|.*?\|>)/
+  let inTag = false
 
   return {
     /**
@@ -29,27 +38,35 @@ export function useLlmmarkerParser(options: {
     async consume(textPart: string) {
       buffer += textPart
 
-      // The regex splits the buffer by tags, keeping the tags in the result array.
-      const parts = buffer.split(tagRegex)
-
-      // The last element of the array is the remainder of the string after the last
-      // complete tag. It could be a partial literal or a partial tag. We keep it
-      // in the buffer for the next consume call.
-      const processableParts = parts.slice(0, -1)
-      buffer = parts[parts.length - 1] || ''
+      while (buffer.length > 0) {
+        if (!inTag) {
+          const openTagIndex = buffer.indexOf(TAG_OPEN)
+          if (openTagIndex < 0) {
+            if (buffer.length - 1 >= minLiteralEmitLength) {
+              const emit = buffer.slice(0, -1)
+              buffer = buffer[buffer.length - 1]
+              await options.onLiteral?.(emit)
+            }
+            break
+          }
 
-      for (const part of processableParts) {
-        if (!part)
-          continue // Skip empty strings that can result from the split.
-
-        // Check if the part is a tag or a literal.
-        if (tagRegex.test(part)) {
-          // Extract the content from inside the tag and pass it to the callback.
-          const specialContent = part.slice(2, -2)
-          await options.onSpecial?.(specialContent)
+          if (openTagIndex > 0) {
+            const emit = buffer.slice(0, openTagIndex)
+            buffer = buffer.slice(openTagIndex)
+            await options.onLiteral?.(emit)
+          }
+          inTag = true
         }
         else {
-          await options.onLiteral?.(part)
+          const closeTagIndex = buffer.indexOf(TAG_CLOSE)
+          if (closeTagIndex < 0) {
+            break
+          }
+
+          const emit = buffer.slice(0, closeTagIndex + TAG_CLOSE.length)
+          buffer = buffer.slice(closeTagIndex + TAG_CLOSE.length)
+          await options.onSpecial?.(emit)
+          inTag = false
         }
       }
     },
@@ -60,7 +77,8 @@ export function useLlmmarkerParser(options: {
      * This should be called after the stream has ended.
      */
     async end() {
-      if (buffer) {
+      // Incomplete tag should not be emitted as literals.
+      if (!inTag && buffer.length > 0) {
         await options.onLiteral?.(buffer)
         buffer = ''
       }
diff --git a/packages/stage-ui/src/stores/chat.ts b/packages/stage-ui/src/stores/chat.ts
@@ -141,6 +141,7 @@ export const useChatStore = defineStore('chat', () => {
             await hook(special)
           }
         },
+        minLiteralEmitLength: 24, // Avoid emitting literals too fast. This is a magic number and can be changed later.
       })
 
       const toolCallQueue = useQueue<ChatSlices>({

Original file line number	Diff line number	Diff line change
`@@ -141,6 +141,7 @@ export const useChatStore = defineStore('chat', () => {`
`141`	`141`	`await hook(special)`
`142`	`142`	`}`
`143`	`143`	`},`
	`144`	`+ minLiteralEmitLength: 24, // Avoid emitting literals too fast. This is a magic number and can be changed later.`
`144`	`145`	`})`
`145`	`146`
`146`	`147`	`const toolCallQueue = useQueue<ChatSlices>({`