feat(ui): Enhanced agent thinking detection for Ollama models
- Added a semantic detection module (agent-status-detection.ts) that analyzes message content for keywords like 'standby', 'processing', and 'analyzing'
- Updated isAgentThinking() in multi-task-chat to use semantic detection when streaming has technically ended but the agent is still conceptually working
- Added dynamic status messages (PROCESSING, AGENT PROCESSING, etc.) instead of the static THINKING/STREAMING labels
- Enhanced session-status.ts to check semantic content before returning idle
- Fixes an issue where Ollama models output a status message and then pause, causing the UI to incorrectly show a ready-to-send state
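As a rough sketch of the behavior the new module is meant to provide (the MessageRecord literal below is reduced to the fields the module actually reads; the "complete" status value and the "@/stores" import alias are assumptions, not taken from this commit):

import { detectAgentWorkingState, getAgentStatusMessage } from "@/lib/agent-status-detection";
import type { MessageRecord } from "@/stores/message-v2/types";

// An Ollama-style reply that prints a status line and then pauses: streaming has
// ended, but the agent is still conceptually working.
const msg = {
  role: "assistant",
  status: "complete",               // assumed non-streaming/sending status value
  updatedAt: Date.now() - 10_000,   // old enough to skip the recency heuristic
  partIds: ["p1"],
  parts: { p1: { data: { type: "text", text: "Standby, analyzing the repository..." } } },
} as unknown as MessageRecord;

const state = detectAgentWorkingState(msg);
// state.isWorking === true with confidence "high" (the /stand\s*by/i pattern matches),
// so isAgentThinking() stays true and the status pill keeps showing
// getAgentStatusMessage(msg) in uppercase instead of a ready-to-send input.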
@@ -10,6 +10,7 @@ import { addToTaskQueue, getSoloState, setActiveTaskId, toggleAutonomous, toggle
 import { getLogger } from "@/lib/logger";
 import { clearCompactionSuggestion, getCompactionSuggestion } from "@/stores/session-compaction";
 import { emitSessionSidebarRequest } from "@/lib/session-sidebar-events";
+import { detectAgentWorkingState, getAgentStatusMessage } from "@/lib/agent-status-detection";
 import {
   Command,
   Plus,
@@ -216,7 +217,36 @@ export default function MultiTaskChat(props: MultiTaskChatProps) {
 
     const store = messageStore();
     const lastMsg = store.getMessage(ids[ids.length - 1]);
-    return lastMsg?.role === "assistant" && (lastMsg.status === "streaming" || lastMsg.status === "sending");
+
+    // Basic check: streaming or sending status
+    if (lastMsg?.role === "assistant" && (lastMsg.status === "streaming" || lastMsg.status === "sending")) {
+      return true;
+    }
+
+    // Enhanced check: semantic detection for "standby", "processing" messages
+    // This catches Ollama models that output status messages and pause
+    if (lastMsg?.role === "assistant") {
+      const workingState = detectAgentWorkingState(lastMsg);
+      return workingState.isWorking;
+    }
+
+    return false;
+  });
+
+  // Get dynamic status message for display
+  const agentStatusMessage = createMemo(() => {
+    const ids = filteredMessageIds();
+    if (ids.length === 0) return "THINKING";
+
+    const store = messageStore();
+    const lastMsg = store.getMessage(ids[ids.length - 1]);
+
+    if (!lastMsg || lastMsg.role !== "assistant") {
+      return "THINKING";
+    }
+
+    const statusMsg = getAgentStatusMessage(lastMsg);
+    return statusMsg?.toUpperCase() || "THINKING";
   });
 
   // Auto-scroll during streaming - DISABLED for performance testing
@@ -539,7 +569,7 @@ export default function MultiTaskChat(props: MultiTaskChatProps) {
   <Show when={isAgentThinking()}>
     <div class="flex items-center space-x-2 px-3 py-1.5 bg-violet-500/15 border border-violet-500/30 rounded-lg animate-pulse shadow-[0_0_20px_rgba(139,92,246,0.2)]">
       <Sparkles size={12} class="text-violet-400 animate-spin" style={{ "animation-duration": "3s" }} />
-      <span class="text-[10px] font-black text-violet-400 uppercase tracking-tight">Streaming</span>
+      <span class="text-[10px] font-black text-violet-400 uppercase tracking-tight">{agentStatusMessage()}</span>
       <span class="text-[10px] font-bold text-violet-300">{formatTokenTotal(tokenStats().used)}</span>
     </div>
   </Show>
@@ -846,7 +876,7 @@ export default function MultiTaskChat(props: MultiTaskChatProps) {
         <div class="w-1 h-1 bg-indigo-400 rounded-full animate-bounce" style={{ "animation-delay": "150ms" }} />
         <div class="w-1 h-1 bg-indigo-400 rounded-full animate-bounce" style={{ "animation-delay": "300ms" }} />
       </div>
-      <span class="text-[9px] font-bold text-indigo-400">{isAgentThinking() ? "THINKING" : "SENDING"}</span>
+      <span class="text-[9px] font-bold text-indigo-400">{isSending() ? "SENDING" : agentStatusMessage()}</span>
     </div>
   </Show>
 </div>
packages/ui/src/lib/agent-status-detection.ts (new file, 249 lines)
@@ -0,0 +1,249 @@
/**
 * Agent Status Detection Module
 *
 * Provides intelligent detection of when an agent is still "working" even after
 * streaming has technically completed. This handles cases where:
 * 1. Agent outputs "standby", "processing", "working" messages
 * 2. Agent is in multi-step reasoning mode
 * 3. Ollama models pause between thinking and output phases
 */

import type { MessageRecord } from "../stores/message-v2/types"

// Keywords that indicate the agent is still processing
const WORKING_KEYWORDS = [
  "standby",
  "stand by",
  "processing",
  "please wait",
  "working on",
  "analyzing",
  "thinking",
  "computing",
  "calculating",
  "evaluating",
  "generating",
  "preparing",
  "loading",
  "fetching",
  "retrieving",
  "in progress",
  "one moment",
  "hold on",
  "just a sec",
  "give me a moment",
  "let me",
  "i'll",
  "i will",
  "checking",
  "scanning",
  "searching",
  "looking",
  "finding"
] as const

// Keywords that indicate the agent has finished
const COMPLETION_KEYWORDS = [
  "here is",
  "here's",
  "here are",
  "done",
  "complete",
  "finished",
  "result",
  "solution",
  "answer",
  "output",
  "summary",
  "conclusion",
  "final",
  "successfully",
  "implemented",
  "fixed",
  "resolved",
  "created",
  "updated"
] as const

// Patterns that strongly indicate agent is still working
const WORKING_PATTERNS = [
  /stand\s*by/i,
  /processing\s*(complete\s*)?data/i,
  /please\s+wait/i,
  /working\s+on/i,
  /analyzing/i,
  /\bwait\b/i,
  /\bone\s+moment\b/i,
  /\bhold\s+on\b/i,
  /\.\.\.\s*$/, // Ends with ellipsis
  /…\s*$/, // Ends with unicode ellipsis
] as const

/**
 * Extracts text content from a message's parts
 */
function extractMessageText(message: MessageRecord): string {
  const textParts: string[] = []

  for (const partId of message.partIds) {
    const part = message.parts[partId]
    if (part?.data) {
      const data = part.data as Record<string, unknown>
      if (data.type === "text" && typeof data.text === "string") {
        textParts.push(data.text)
      }
    }
  }

  return textParts.join("\n")
}

/**
 * Gets the last N characters of a message for keyword detection
 */
function getRecentContent(message: MessageRecord, charLimit = 500): string {
  const fullText = extractMessageText(message)
  if (fullText.length <= charLimit) {
    return fullText.toLowerCase()
  }
  return fullText.slice(-charLimit).toLowerCase()
}

/**
 * Checks if the message content indicates the agent is still working
 */
export function detectAgentWorkingState(message: MessageRecord | null | undefined): {
  isWorking: boolean
  reason?: string
  confidence: "high" | "medium" | "low"
} {
  if (!message) {
    return { isWorking: false, confidence: "high" }
  }

  // If message status is streaming or sending, definitely working
  if (message.status === "streaming" || message.status === "sending") {
    return { isWorking: true, reason: "Active streaming", confidence: "high" }
  }

  // Get recent content to analyze
  const recentContent = getRecentContent(message)

  if (!recentContent) {
    return { isWorking: false, confidence: "high" }
  }

  // Check for working patterns with high confidence
  for (const pattern of WORKING_PATTERNS) {
    if (pattern.test(recentContent)) {
      return {
        isWorking: true,
        reason: `Pattern match: ${pattern.source}`,
        confidence: "high"
      }
    }
  }

  // Check if recent content ends with working keywords
  const lastLine = recentContent.split("\n").pop()?.trim() || ""

  for (const keyword of WORKING_KEYWORDS) {
    if (lastLine.includes(keyword)) {
      // Check if there's also a completion keyword nearby
      const hasCompletionNearby = COMPLETION_KEYWORDS.some(ck =>
        recentContent.slice(-200).includes(ck)
      )

      if (!hasCompletionNearby) {
        return {
          isWorking: true,
          reason: `Working keyword: "${keyword}"`,
          confidence: "medium"
        }
      }
    }
  }

  // Check message age - if very recent and short, might still be working
  const now = Date.now()
  const messageAge = now - message.updatedAt
  const contentLength = extractMessageText(message).length

  // If message was updated very recently (< 2s) and content is short
  if (messageAge < 2000 && contentLength < 100) {
    return {
      isWorking: true,
      reason: "Recently updated with short content",
      confidence: "low"
    }
  }

  return { isWorking: false, confidence: "high" }
}

/**
 * Check if the last assistant message indicates agent is still conceptually working
 */
export function isAgentConceptuallyThinking(
  messages: MessageRecord[],
  lastAssistantMessage: MessageRecord | null | undefined
): boolean {
  if (!lastAssistantMessage) {
    return false
  }

  // Check if message status indicates active work
  if (lastAssistantMessage.status === "streaming" ||
      lastAssistantMessage.status === "sending") {
    return true
  }

  // Use semantic detection
  const workingState = detectAgentWorkingState(lastAssistantMessage)
  return workingState.isWorking
}

/**
 * Get a user-friendly status message for the current agent state
 */
export function getAgentStatusMessage(
  message: MessageRecord | null | undefined
): string | null {
  if (!message) {
    return null
  }

  const workingState = detectAgentWorkingState(message)

  if (!workingState.isWorking) {
    return null
  }

  if (message.status === "streaming") {
    return "Streaming..."
  }

  if (message.status === "sending") {
    return "Sending..."
  }

  // Based on reason
  if (workingState.reason?.includes("standby") ||
      workingState.reason?.includes("stand by")) {
    return "Agent processing..."
  }

  if (workingState.reason?.includes("processing")) {
    return "Processing..."
  }

  if (workingState.reason?.includes("analyzing")) {
    return "Analyzing..."
  }

  if (workingState.reason?.includes("ellipsis")) {
    return "Thinking..."
  }

  return "Working..."
}
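A couple of illustrative calls against the module above (sketch only: the sampleMessage helper and its relative import path are hypothetical, only the MessageRecord fields the module reads are filled in, and the "complete" status value is assumed):

import type { MessageRecord } from "../stores/message-v2/types"
import { detectAgentWorkingState } from "./agent-status-detection"

// Builds a text-only assistant message; the cast is for illustration only.
function sampleMessage(text: string): MessageRecord {
  return {
    role: "assistant",
    status: "complete",              // assumed non-streaming/sending status value
    updatedAt: Date.now() - 10_000,  // old enough to skip the recency heuristic
    partIds: ["p1"],
    parts: { p1: { data: { type: "text", text } } },
  } as unknown as MessageRecord
}

// The last line ends on a working keyword and no completion keyword is nearby:
detectAgentWorkingState(sampleMessage("Scanning the workspace for matches"))
// -> { isWorking: true, reason: 'Working keyword: "scanning"', confidence: "medium" }

// A completion keyword ("done", "here is", "summary") within the last 200 characters
// suppresses the keyword match, so the UI and session status can go back to idle:
detectAgentWorkingState(sampleMessage("Scanning done. Here is the summary of matches."))
// -> { isWorking: false, confidence: "high" }

The "medium" confidence in the first call matters for the session-status change below, which only reports "working" when the confidence is not "low".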
packages/ui/src/stores/session-status.ts
@@ -4,6 +4,7 @@ import type { MessageRecord } from "./message-v2/types"
 import { sessions } from "./sessions"
 import { getSessionCompactionState } from "./session-compaction"
 import { messageStoreBus } from "./message-v2/bus"
+import { detectAgentWorkingState } from "../lib/agent-status-detection"
 
 function getSession(instanceId: string, sessionId: string): Session | null {
   const instanceSessions = sessions().get(instanceId)
@@ -159,6 +160,15 @@ export function getSessionStatus(instanceId: string, sessionId: string): Session
     return "working"
   }
+
+  // Enhanced: Check if last assistant message content suggests agent is still working
+  // This catches Ollama models that output "standby", "processing" messages and pause
+  if (lastRecord && lastRecord.role === "assistant") {
+    const workingState = detectAgentWorkingState(lastRecord)
+    if (workingState.isWorking && workingState.confidence !== "low") {
+      return "working"
+    }
+  }
 
   return "idle"
 }