From 47ef10f7802b4e5768bbbe57e9721061af2d1a4e Mon Sep 17 00:00:00 2001
From: digua <i@digua.me>
Date: Thu, 30 Apr 2026 22:08:25 +0800
Subject: [PATCH] =?UTF-8?q?feat:=20=E4=B8=8A=E4=B8=8B=E6=96=87=E5=8E=8B?=
 =?UTF-8?q?=E7=BC=A9=E9=80=BB=E8=BE=91=E4=BC=98=E5=8C=96?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 electron/main/ai/agent/index.ts               |  2 +-
 electron/main/ai/agent/types.ts               |  9 ++-
 electron/main/ai/compression/index.ts         | 41 ++++++++----
 electron/main/ai/conversations.ts             | 37 +++++------
 electron/main/ipc/ai.ts                       | 14 ++--
 electron/preload/apis/ai.ts                   | 10 ++-
 electron/preload/index.d.ts                   | 10 ++-
 electron/shared/types.ts                      |  2 +-
 src/components/AIChat/ChatExplorer.vue        | 11 +++-
 .../AIChat/chat/AIThinkingIndicator.vue       | 20 +++++-
 src/components/AIChat/chat/ChatMessage.vue    | 30 ++++-----
 src/components/AIChat/chat/ChatStatusBar.vue  | 64 +------------------
 src/components/AIChat/utils/chatMessages.ts   | 16 +++--
 src/i18n/locales/en-US/ai.json                |  5 +-
 src/i18n/locales/ja-JP/ai.json                |  5 +-
 src/i18n/locales/zh-CN/ai.json                |  5 +-
 src/i18n/locales/zh-TW/ai.json                |  5 +-
 src/stores/aiChat.ts                          | 18 +++++-
 18 files changed, 168 insertions(+), 136 deletions(-)

diff --git a/electron/main/ai/agent/index.ts b/electron/main/ai/agent/index.ts
index 4e2745a0..0f21d034 100644
--- a/electron/main/ai/agent/index.ts
+++ b/electron/main/ai/agent/index.ts
@@ -23,7 +23,7 @@ import { buildSystemPrompt } from './prompt-builder'
 import { extractThinkingContent, stripToolCallTags } from './content-parser'
 import { AgentEventHandler } from './event-handler'
 
-type SimpleHistoryMessage = { role: 'user' | 'assistant' | 'summary'; content: string }
+type SimpleHistoryMessage = { role: 'user' | 'assistant' | 'system'; content: string }
 
 // Re-export types for external consumers
 export type { AgentConfig, AgentStreamChunk, AgentResult, TokenUsage, AgentRuntimeStatus, SkillContext } from './types'
diff --git a/electron/main/ai/agent/types.ts b/electron/main/ai/agent/types.ts
index effa5c6f..79c949c6 100644
--- a/electron/main/ai/agent/types.ts
+++ b/electron/main/ai/agent/types.ts
@@ -21,7 +21,7 @@ export interface AgentConfig {
  */
 export interface AgentStreamChunk {
   /** chunk 类型 */
-  type: 'content' | 'think' | 'tool_start' | 'tool_result' | 'status' | 'done' | 'error'
+  type: 'content' | 'think' | 'tool_start' | 'tool_result' | 'status' | 'compression_done' | 'done' | 'error'
   /** 文本内容（type=content 时） */
   content?: string
   /** 思考标签名称（type=think 时） */
@@ -42,6 +42,13 @@ export interface AgentStreamChunk {
   usage?: TokenUsage
   /** 运行状态（type=status 时返回） */
   status?: AgentRuntimeStatus
+  /** 压缩结果（type=compression_done 时） */
+  compressionResult?: {
+    summaryContent: string
+    tokensBefore: number
+    tokensAfter: number
+    timestamp: number
+  }
 }
 
 /**
diff --git a/electron/main/ai/compression/index.ts b/electron/main/ai/compression/index.ts
index b3036d4f..97321bcc 100644
--- a/electron/main/ai/compression/index.ts
+++ b/electron/main/ai/compression/index.ts
@@ -5,8 +5,8 @@
  * 核心流程：
  *   1. 计算当前上下文总 token → 未超阈值则跳过
  *   2. 确定缓冲区：最近 bufferSizePercent% context window 的消息原文
- *   3. 缓冲区之前的消息（含旧 summary）→ LLM 压缩为新摘要
- *   4. 写入 ai_message(role='summary')，替换旧 summary
+ *   3. 缓冲区之前的消息（含旧 system 摘要）→ LLM 压缩为新摘要
+ *   4. 写入 ai_message(role='system')，替换旧摘要
  *   5. Thrashing 检查
  */
 
@@ -49,18 +49,21 @@ export interface CompressionResult {
     | 'error'
   tokensBefore?: number
   tokensAfter?: number
+  summaryContent?: string
   error?: string
 }
 
-const DEFAULT_COMPRESSION_PROMPT = `Please compress the following conversation history into a concise summary, preserving key information, decisions, and context.
-Requirements:
-- Preserve key facts, data, names, and conclusions
-- Preserve user preferences and important instructions
-- Preserve time points and important events
-- Output in the same language as the conversation
-- Keep it within {maxTokens} tokens
+const DEFAULT_COMPRESSION_PROMPT = `You are a context compression assistant. Compress the conversation below into a structured summary.
 
-Conversation history:
+STRICT RULES:
+- Output ONLY the summary content. No greetings, no preamble, no meta-commentary, no word/token counts.
+- Use the same language as the conversation.
+- Maximum output length: {maxTokens} tokens. Be concise.
+- Organize by topic/thread when possible.
+- Preserve: key facts, decisions, user preferences, data, names, timestamps, action items.
+- Omit: pleasantries, filler, redundant back-and-forth.
+
+CONVERSATION:
 {messages}`
 
 const DEFAULT_CONTEXT_WINDOW = 128000
@@ -121,7 +124,7 @@ export async function checkAndCompress(
 
     // 构建压缩输入文本
     const compressInput = buildCompressionInput(messagesToCompress, summary)
-    const targetTokens = Math.floor(contextWindow * 0.1)
+    const targetTokens = Math.min(Math.floor(contextWindow * 0.1), 16384)
 
     // 三级降级：独立模型 → 当前模型 → 强制截断
     let summaryText: string | null = null
@@ -158,11 +161,23 @@ export async function checkAndCompress(
         'Compression',
         `Thrashing detected: ${tokensAfter} tokens after compression still >= ${thresholdTokens}`
       )
-      return { compressed: true, reason: 'thrashing', tokensBefore: currentTokens, tokensAfter }
+      return {
+        compressed: true,
+        reason: 'thrashing',
+        tokensBefore: currentTokens,
+        tokensAfter,
+        summaryContent: summaryText,
+      }
     }
 
     aiLogger.info('Compression', `Compressed: ${currentTokens} → ${tokensAfter} tokens`)
-    return { compressed: true, reason: 'success', tokensBefore: currentTokens, tokensAfter }
+    return {
+      compressed: true,
+      reason: 'success',
+      tokensBefore: currentTokens,
+      tokensAfter,
+      summaryContent: summaryText,
+    }
   } catch (error) {
     aiLogger.error('Compression', 'Compression failed', { error: String(error) })
     return { compressed: false, reason: 'error', error: String(error) }
diff --git a/electron/main/ai/conversations.ts b/electron/main/ai/conversations.ts
index 94473a36..6eaaa330 100644
--- a/electron/main/ai/conversations.ts
+++ b/electron/main/ai/conversations.ts
@@ -224,7 +224,7 @@ export type ContentBlock =
 /**
  * AI 消息类型
  */
-export type AIMessageRole = 'user' | 'assistant' | 'summary'
+export type AIMessageRole = 'user' | 'assistant' | 'system'
 
 export interface TokenUsageData {
   promptTokens: number
@@ -509,38 +509,36 @@ export function getConversationTokenUsage(conversationId: string): TokenUsageDat
  * 以避免重复加载已被压缩的旧消息。
  *
  * @param conversationId 对话 ID
- * @param maxMessages 最大返回条数（取最近 N 条，仅对 summary 之后的消息生效）
+ * @param maxMessages 最大返回条数（取最近 N 条，仅对 system 摘要之后的消息生效）
  */
 export function getHistoryForAgent(
   conversationId: string,
   maxMessages?: number
-): Array<{ role: 'user' | 'assistant' | 'summary'; content: string }> {
+): Array<{ role: 'user' | 'assistant' | 'system'; content: string }> {
   const messages = getMessages(conversationId)
   const validMessages = messages.filter(
-    (m) => (m.role === 'user' || m.role === 'assistant' || m.role === 'summary') && m.content?.trim()
+    (m) => (m.role === 'user' || m.role === 'assistant' || m.role === 'system') && m.content?.trim()
   )
 
-  // 查找最新的 summary 消息位置
-  let summaryIndex = -1
+  // 查找最新的 system 消息位置（压缩摘要）
+  let systemIndex = -1
   for (let i = validMessages.length - 1; i >= 0; i--) {
-    if (validMessages[i].role === 'summary') {
-      summaryIndex = i
+    if (validMessages[i].role === 'system') {
+      systemIndex = i
       break
     }
   }
 
-  let result: Array<{ role: 'user' | 'assistant' | 'summary'; content: string }>
+  let result: Array<{ role: 'user' | 'assistant' | 'system'; content: string }>
 
-  if (summaryIndex >= 0) {
-    // 返回 summary + summary 之后的消息
-    result = validMessages.slice(summaryIndex).map((m) => ({ role: m.role, content: m.content }))
+  if (systemIndex >= 0) {
+    result = validMessages.slice(systemIndex).map((m) => ({ role: m.role, content: m.content }))
   } else {
     result = validMessages.map((m) => ({ role: m.role, content: m.content }))
   }
 
   if (maxMessages && result.length > maxMessages) {
-    // 如果有 summary 且它是第一条，保留它再截取后面的
-    if (result.length > 0 && result[0].role === 'summary') {
+    if (result.length > 0 && result[0].role === 'system') {
       const rest = result.slice(1)
       const truncated = rest.slice(-(maxMessages - 1))
       return [result[0], ...truncated]
@@ -553,15 +551,14 @@ export function getHistoryForAgent(
 // ==================== Summary / 压缩专用 ====================
 
 /**
- * 添加 summary 消息并替换旧的 summary（每个对话只保留一条最新 summary）
+ * Store the compression summary as role='system', replacing older summaries (incl. legacy role='summary' rows).
  */
 export function addSummaryMessage(conversationId: string, content: string): AIMessage {
   const db = getAiDb()
 
-  // 删除该对话中所有旧的 summary 消息
-  db.prepare("DELETE FROM ai_message WHERE conversation_id = ? AND role = 'summary'").run(conversationId)
+  db.prepare("DELETE FROM ai_message WHERE conversation_id = ? AND role IN ('system', 'summary')").run(conversationId)
 
-  return addMessage(conversationId, 'summary', content)
+  return addMessage(conversationId, 'system', content)
 }
 
 /**
@@ -575,7 +572,7 @@ export function getLatestSummary(conversationId: string): AIMessage | null {
     SELECT id, conversation_id as conversationId, role, content, timestamp,
            data_keywords as dataKeywords, data_message_count as dataMessageCount, content_blocks as contentBlocks
     FROM ai_message
-    WHERE conversation_id = ? AND role = 'summary'
+    WHERE conversation_id = ? AND role = 'system'
     ORDER BY timestamp DESC
     LIMIT 1
   `
@@ -607,7 +604,7 @@ export function getLatestSummary(conversationId: string): AIMessage | null {
 }
 
 /**
- * 获取 summary 之后的所有 user/assistant 消息（用于压缩计算）
+ * 获取 system（压缩摘要）之后的所有 user/assistant 消息（用于压缩计算）
  */
 export function getMessagesAfterSummary(
   conversationId: string,
diff --git a/electron/main/ipc/ai.ts b/electron/main/ipc/ai.ts
index 53574161..38ec29e8 100644
--- a/electron/main/ipc/ai.ts
+++ b/electron/main/ipc/ai.ts
@@ -1093,7 +1093,7 @@ export function registerAIHandlers({ win }: IpcContext): void {
               chunk: {
                 type: 'status',
                 status: {
-                  phase: 'preparing',
+                  phase: 'compressing',
                   round: 0,
                   toolsUsed: 0,
                   contextTokens: 0,
@@ -1118,13 +1118,17 @@ export function registerAIHandlers({ win }: IpcContext): void {
 
             aiLogger.info('IPC', `Compression result for ${requestId}`, compressionResult)
 
-            if (compressionResult.compressed) {
+            if (compressionResult.compressed && compressionResult.summaryContent) {
               win.webContents.send('agent:streamChunk', {
                 requestId,
                 chunk: {
-                  type: 'status',
-                  status: 'compressed',
-                  content: `Context compressed: ${compressionResult.tokensBefore} → ${compressionResult.tokensAfter} tokens`,
+                  type: 'compression_done',
+                  compressionResult: {
+                    summaryContent: compressionResult.summaryContent,
+                    tokensBefore: compressionResult.tokensBefore ?? 0,
+                    tokensAfter: compressionResult.tokensAfter ?? 0,
+                    timestamp: Date.now(),
+                  },
                 },
               })
             }
diff --git a/electron/preload/apis/ai.ts b/electron/preload/apis/ai.ts
index 1482aa1e..6eaa392b 100644
--- a/electron/preload/apis/ai.ts
+++ b/electron/preload/apis/ai.ts
@@ -41,7 +41,7 @@ export type ContentBlock =
     }
   | { type: 'skill'; skillId: string; skillName: string }
 
-export type AIMessageRole = 'user' | 'assistant' | 'summary'
+export type AIMessageRole = 'user' | 'assistant' | 'system'
 
 export interface TokenUsageData {
   promptTokens: number
@@ -93,7 +93,7 @@ import type { TokenUsage, AgentRuntimeStatus, SerializedErrorInfo } from '../../
 export type { SerializedErrorInfo } from '../../shared/types'
 
 export interface AgentStreamChunk {
-  type: 'content' | 'think' | 'tool_start' | 'tool_result' | 'status' | 'done' | 'error'
+  type: 'content' | 'think' | 'tool_start' | 'tool_result' | 'status' | 'compression_done' | 'done' | 'error'
   content?: string
   thinkTag?: string
   thinkDurationMs?: number
@@ -103,6 +103,12 @@ export interface AgentStreamChunk {
   status?: AgentRuntimeStatus
   error?: SerializedErrorInfo
   isFinished?: boolean
+  compressionResult?: {
+    summaryContent: string
+    tokensBefore: number
+    tokensAfter: number
+    timestamp: number
+  }
   /** Token 使用量（type=done 时返回累计值） */
   usage?: TokenUsage
 }
diff --git a/electron/preload/index.d.ts b/electron/preload/index.d.ts
index 6cfccc36..54337f11 100644
--- a/electron/preload/index.d.ts
+++ b/electron/preload/index.d.ts
@@ -305,7 +305,7 @@ type AIContentBlock =
     }
   | { type: 'skill'; skillId: string; skillName: string }
 
-type AIMessageRole = 'user' | 'assistant' | 'summary'
+type AIMessageRole = 'user' | 'assistant' | 'system'
 
 interface AITokenUsageData {
   promptTokens: number
@@ -720,7 +720,7 @@ interface RAGConfig {
 
 // Agent 相关类型
 interface AgentStreamChunk {
-  type: 'content' | 'think' | 'tool_start' | 'tool_result' | 'status' | 'done' | 'error'
+  type: 'content' | 'think' | 'tool_start' | 'tool_result' | 'status' | 'compression_done' | 'done' | 'error'
   content?: string
   thinkTag?: string
   thinkDurationMs?: number
@@ -730,6 +730,12 @@ interface AgentStreamChunk {
   status?: AgentRuntimeStatus
   error?: SerializedErrorInfo
   isFinished?: boolean
+  compressionResult?: {
+    summaryContent: string
+    tokensBefore: number
+    tokensAfter: number
+    timestamp: number
+  }
   /** Token 使用量（type=done 时返回累计值） */
   usage?: TokenUsage
 }
diff --git a/electron/shared/types.ts b/electron/shared/types.ts
index b53e2572..b48676c1 100644
--- a/electron/shared/types.ts
+++ b/electron/shared/types.ts
@@ -31,7 +31,7 @@ export interface TokenUsage {
 }
 
 export interface AgentRuntimeStatus {
-  phase: 'preparing' | 'thinking' | 'tool_running' | 'responding' | 'completed' | 'aborted' | 'error'
+  phase: 'compressing' | 'preparing' | 'thinking' | 'tool_running' | 'responding' | 'completed' | 'aborted' | 'error'
   round: number
   toolsUsed: number
   currentTool?: string
diff --git a/src/components/AIChat/ChatExplorer.vue b/src/components/AIChat/ChatExplorer.vue
index 1c47cc99..918bd71d 100644
--- a/src/components/AIChat/ChatExplorer.vue
+++ b/src/components/AIChat/ChatExplorer.vue
@@ -398,7 +398,15 @@ watch(
 
               <!-- QA 对渲染 -->
               <template v-for="pair in qaPairs" :key="pair.id">
-                <div class="qa-pair space-y-6 pb-4">
+                <!-- Standalone message (system compression summary or any other non-user/assistant role) -->
+                <ChatMessage
+                  v-if="pair.standalone"
+                  :role="pair.standalone.role"
+                  :content="pair.standalone.content"
+                  :timestamp="pair.standalone.timestamp"
+                />
+                <!-- QA 对 -->
+                <div v-else class="qa-pair space-y-6 pb-4">
                   <!-- 用户问题 -->
                   <ChatMessage
                     v-if="pair.user && (pair.user.role === 'user' || pair.user.content)"
@@ -434,6 +442,7 @@ watch(
                 "
                 :current-tool-status="currentToolStatus"
                 :tools-used="toolsUsedInCurrentRound"
+                :agent-status="agentStatus"
               />
             </div>
           </div>
diff --git a/src/components/AIChat/chat/AIThinkingIndicator.vue b/src/components/AIChat/chat/AIThinkingIndicator.vue
index 38199c35..1661ce0b 100644
--- a/src/components/AIChat/chat/AIThinkingIndicator.vue
+++ b/src/components/AIChat/chat/AIThinkingIndicator.vue
@@ -1,5 +1,7 @@
 <script setup lang="ts">
+import { computed } from 'vue'
 import { useI18n } from 'vue-i18n'
+import type { AgentRuntimeStatus } from '@electron/shared/types'
 
 const { t, te } = useI18n()
 
@@ -10,7 +12,7 @@ function localizedToolName(name: string, fallback?: string): string {
 }
 
 // Props
-defineProps<{
+const props = defineProps<{
   // 当前工具执行状态
   currentToolStatus: {
     name: string
@@ -19,11 +21,25 @@ defineProps<{
   } | null
   // 当前轮次已使用的工具列表
   toolsUsed: string[]
+  // Agent 运行状态
+  agentStatus?: AgentRuntimeStatus | null
 }>()
+
+const isCompressing = computed(() => props.agentStatus?.phase === 'compressing')
 </script>
 
 <template>
-  <div class="flex items-start gap-3">
+  <!-- 压缩上下文状态（工具块样式，无气泡包裹） -->
+  <div
+    v-if="isCompressing"
+    class="flex w-fit items-center gap-1.5 rounded-lg bg-gray-100 px-2.5 py-1 text-xs transition-colors dark:bg-gray-800/50"
+  >
+    <UIcon name="i-heroicons-arrow-path" class="h-3.5 w-3.5 shrink-0 animate-spin text-gray-600 dark:text-gray-400" />
+    <span class="font-medium text-gray-600 dark:text-gray-400">{{ t('ai.chat.thinking.compressing') }}</span>
+  </div>
+
+  <!-- 常规思考/工具状态（头像+气泡） -->
+  <div v-else class="flex items-start gap-3">
     <!-- AI 头像 -->
     <div
       class="flex h-8 w-8 shrink-0 items-center justify-center rounded-full bg-linear-to-br from-pink-500 to-pink-600"
diff --git a/src/components/AIChat/chat/ChatMessage.vue b/src/components/AIChat/chat/ChatMessage.vue
index e505e2a2..1d13d0c8 100644
--- a/src/components/AIChat/chat/ChatMessage.vue
+++ b/src/components/AIChat/chat/ChatMessage.vue
@@ -13,7 +13,7 @@ const toast = useToast()
 
 // Props
 const props = defineProps<{
-  role: 'user' | 'assistant' | 'summary'
+  role: 'user' | 'assistant' | 'system'
   content: string
   timestamp: number
   isStreaming?: boolean
@@ -30,7 +30,7 @@ const formattedTime = computed(() => {
 
 // 是否是用户消息
 const isUser = computed(() => props.role === 'user')
-const isSummary = computed(() => props.role === 'summary')
+const isSystem = computed(() => props.role === 'system')
 
 // 创建 markdown-it 实例
 const md = new MarkdownIt({
@@ -302,29 +302,27 @@ async function handleCopyMarkdown() {
 </script>
 
 <template>
-  <div class="flex items-start gap-3" :class="[isUser ? 'flex-row-reverse' : '', isSummary ? 'justify-center' : '']">
+  <div class="flex items-start gap-3" :class="[isUser ? 'flex-row-reverse' : '', isSystem ? 'justify-center' : '']">
     <!-- 消息内容 -->
-    <div :class="[isSummary ? 'w-full min-w-0' : 'max-w-[85%] min-w-0']">
-      <!-- Summary 消息：可折叠的上下文摘要 -->
-      <template v-if="isSummary">
+    <div :class="[isSystem ? 'w-full min-w-0' : 'max-w-[85%] min-w-0']">
+      <!-- System 消息：可折叠的上下文摘要 -->
+      <template v-if="isSystem">
         <details
-          class="w-full rounded-xl border border-purple-200 bg-purple-50/50 dark:border-purple-800/50 dark:bg-purple-900/20"
+          class="w-full rounded-lg border border-gray-200 bg-gray-50/80 dark:border-gray-700/50 dark:bg-gray-800/40"
         >
           <summary
-            class="flex cursor-pointer select-none items-center gap-2 px-4 py-2.5 text-sm font-medium text-purple-700 transition-colors hover:text-purple-900 dark:text-purple-300 dark:hover:text-purple-100"
+            class="flex cursor-pointer select-none items-center gap-2 px-3 py-2 text-xs font-medium text-gray-500 transition-colors hover:text-gray-700 dark:text-gray-400 dark:hover:text-gray-200"
           >
-            <UIcon name="i-heroicons-archive-box-arrow-down" class="h-4 w-4 shrink-0" />
+            <UIcon name="i-heroicons-arrow-path" class="h-3.5 w-3.5 shrink-0" />
             <span>{{ t('ai.chat.message.summary.label') }}</span>
-            <span class="ml-auto text-xs font-normal text-purple-400 dark:text-purple-500">
-              {{ t('ai.chat.message.summary.expand') }}
-            </span>
+            <UIcon name="i-heroicons-chevron-right" class="ml-auto h-3 w-3 transition-transform [[open]>summary>&]:rotate-90" />
           </summary>
-          <div class="border-t border-purple-200/50 px-4 py-3 dark:border-purple-800/30">
+          <div class="border-t border-gray-200/60 px-3 py-2.5 dark:border-gray-700/40">
             <div
-              class="prose prose-sm dark:prose-invert max-w-none text-sm leading-relaxed text-gray-700 dark:text-gray-300"
+              class="prose prose-sm dark:prose-invert max-w-none text-xs leading-relaxed text-gray-600 dark:text-gray-300"
               v-html="renderedContent"
             />
-            <p class="mt-3 text-xs italic text-purple-400 dark:text-purple-500">
+            <p class="mt-2 text-[11px] text-gray-400 dark:text-gray-500">
               {{ t('ai.chat.message.summary.info') }}
             </p>
           </div>
@@ -467,7 +465,7 @@ async function handleCopyMarkdown() {
 
       <!-- 时间戳 + 操作按钮（summary 消息和流式输出中不显示） -->
       <div
-        v-if="!isSummary && !isStreaming"
+        v-if="!isSystem && !isStreaming"
         class="mt-1 flex items-center gap-2 px-1"
         :class="[isUser ? 'flex-row-reverse' : '']"
       >
diff --git a/src/components/AIChat/chat/ChatStatusBar.vue b/src/components/AIChat/chat/ChatStatusBar.vue
index 70b1f251..f18421fe 100644
--- a/src/components/AIChat/chat/ChatStatusBar.vue
+++ b/src/components/AIChat/chat/ChatStatusBar.vue
@@ -45,6 +45,8 @@ const agentPhaseClass = computed(() => {
   if (!props.agentStatus) return 'text-gray-500 bg-gray-100 dark:bg-gray-800 dark:text-gray-300'
 
   switch (props.agentStatus.phase) {
+    case 'compressing':
+      return 'text-purple-600 bg-purple-50 dark:bg-purple-900/30 dark:text-purple-300'
     case 'tool_running':
       return 'text-indigo-600 bg-indigo-50 dark:bg-indigo-900/30 dark:text-indigo-300'
     case 'thinking':
@@ -199,51 +201,6 @@ async function handleExportConversation() {
   }
 }
 
-// 手动压缩上下文
-const isCompressing = ref(false)
-
-async function handleManualCompress() {
-  if (isCompressing.value || !props.currentConversationId) return
-
-  const compressionConfig = aiGlobalSettings.value.contextCompression
-  if (!compressionConfig) return
-
-  isCompressing.value = true
-  try {
-    const result = await window.aiApi.compressContext(
-      props.currentConversationId,
-      {
-        enabled: true,
-        tokenThresholdPercent: compressionConfig.tokenThresholdPercent ?? 75,
-        bufferSizePercent: compressionConfig.bufferSizePercent ?? 20,
-        compressionModelConfigId: compressionConfig.compressionModelConfigId,
-      },
-      ''
-    )
-
-    if (result.success && result.result) {
-      if (result.result.compressed) {
-        toast.success(t('ai.chat.statusBar.compress.success'), {
-          description: t('ai.chat.statusBar.compress.successDesc', {
-            before: result.result.tokensBefore ?? '?',
-            after: result.result.tokensAfter ?? '?',
-          }),
-        })
-      } else {
-        toast.warn(t('ai.chat.statusBar.compress.skipped'), {
-          description: t('ai.chat.statusBar.compress.skippedDesc'),
-        })
-      }
-    } else {
-      toast.fail(t('ai.chat.statusBar.compress.failed'), { description: result.error })
-    }
-  } catch (error) {
-    toast.fail(t('ai.chat.statusBar.compress.failed'), { description: String(error) })
-  } finally {
-    isCompressing.value = false
-  }
-}
-
 // 打开当前 AI 日志文件并定位到文件
 async function openAiLogFile() {
   if (isOpeningLog.value) return
@@ -392,23 +349,6 @@ async function openAiLogFile() {
         <UIcon name="i-heroicons-arrow-down-tray" class="h-3.5 w-3.5" />
         <span class="hidden xl:inline">{{ t('ai.chat.statusBar.export.label') }}</span>
       </button>
-      <!-- 手动压缩按钮 -->
-      <button
-        v-if="aiGlobalSettings.contextCompression?.enabled"
-        class="flex shrink-0 items-center gap-1 rounded-md px-1.5 py-1 text-xs text-gray-400 transition-colors hover:bg-gray-100 hover:text-gray-600 disabled:cursor-not-allowed disabled:opacity-60 dark:hover:bg-gray-800 dark:hover:text-gray-300"
-        :title="t('ai.chat.statusBar.compress.title')"
-        :disabled="isCompressing || !currentConversationId"
-        @click="handleManualCompress"
-      >
-        <UIcon
-          name="i-heroicons-archive-box-arrow-down"
-          class="h-3.5 w-3.5"
-          :class="[isCompressing ? 'animate-pulse' : '']"
-        />
-        <span class="hidden xl:inline">
-          {{ isCompressing ? t('ai.chat.statusBar.compress.compressing') : t('ai.chat.statusBar.compress.label') }}
-        </span>
-      </button>
       <!-- 日志按钮 -->
       <button
         class="flex shrink-0 items-center gap-1 rounded-md px-1.5 py-1 text-xs text-gray-400 transition-colors hover:bg-gray-100 hover:text-gray-600 disabled:cursor-not-allowed disabled:opacity-60 dark:hover:bg-gray-800 dark:hover:text-gray-300"
diff --git a/src/components/AIChat/utils/chatMessages.ts b/src/components/AIChat/utils/chatMessages.ts
index 46d7b2e7..31ae1c40 100644
--- a/src/components/AIChat/utils/chatMessages.ts
+++ b/src/components/AIChat/utils/chatMessages.ts
@@ -3,10 +3,12 @@ import type { ChatMessage } from '@/stores/aiChat'
 export interface QAPair {
   user: ChatMessage | null
   assistant: ChatMessage | null
+  /** 非 user/assistant 的独立消息（system 压缩摘要等） */
+  standalone: ChatMessage | null
   id: string
 }
 
-/** 将消息列表分组为 QA 对（用户问题 + AI 回复） */
+/** 将消息列表分组为 QA 对（用户问题 + AI 回复），其他角色作为独立项 */
 export function groupMessagesToQAPairs(messages: ChatMessage[]): QAPair[] {
   const pairs: QAPair[] = []
   let currentUser: ChatMessage | null = null
@@ -14,17 +16,23 @@ export function groupMessagesToQAPairs(messages: ChatMessage[]): QAPair[] {
   for (const msg of messages) {
     if (msg.role === 'user') {
       if (currentUser) {
-        pairs.push({ user: currentUser, assistant: null, id: currentUser.id })
+        pairs.push({ user: currentUser, assistant: null, standalone: null, id: currentUser.id })
       }
       currentUser = msg
     } else if (msg.role === 'assistant') {
-      pairs.push({ user: currentUser, assistant: msg, id: currentUser?.id || msg.id })
+      pairs.push({ user: currentUser, assistant: msg, standalone: null, id: currentUser?.id || msg.id })
       currentUser = null
+    } else {
+      if (currentUser) {
+        pairs.push({ user: currentUser, assistant: null, standalone: null, id: currentUser.id })
+        currentUser = null
+      }
+      pairs.push({ user: null, assistant: null, standalone: msg, id: msg.id })
     }
   }
 
   if (currentUser) {
-    pairs.push({ user: currentUser, assistant: null, id: currentUser.id })
+    pairs.push({ user: currentUser, assistant: null, standalone: null, id: currentUser.id })
   }
 
   return pairs
diff --git a/src/i18n/locales/en-US/ai.json b/src/i18n/locales/en-US/ai.json
index ace53246..254a1180 100644
--- a/src/i18n/locales/en-US/ai.json
+++ b/src/i18n/locales/en-US/ai.json
@@ -120,7 +120,8 @@
     "thinking": {
       "processingResult": "Processing result",
       "called": "Called:",
-      "analyzing": "Analyzing question..."
+      "analyzing": "Analyzing question...",
+      "compressing": "Compressing context..."
     },
     "statusBar": {
       "preset": {
@@ -145,6 +146,7 @@
         "contextTokens": "Context",
         "stats": "seg {segment} · tags {tags}",
         "phase": {
+          "compressing": "Compressing",
           "preparing": "Preparing",
           "thinking": "Thinking",
           "tool_running": "Running tool",
@@ -154,6 +156,7 @@
           "error": "Error"
         },
         "phaseShort": {
+          "compressing": "Compress",
           "preparing": "Prep",
           "thinking": "Think",
           "tool_running": "Tool",
diff --git a/src/i18n/locales/ja-JP/ai.json b/src/i18n/locales/ja-JP/ai.json
index 73552131..ec00cd7f 100644
--- a/src/i18n/locales/ja-JP/ai.json
+++ b/src/i18n/locales/ja-JP/ai.json
@@ -120,7 +120,8 @@
     "thinking": {
       "processingResult": "結果を整理中",
       "called": "実行したツール:",
-      "analyzing": "問題を分析中..."
+      "analyzing": "問題を分析中...",
+      "compressing": "コンテキストを圧縮中..."
     },
     "statusBar": {
       "preset": {
@@ -145,6 +146,7 @@
         "contextTokens": "コンテキスト",
         "stats": "セグメント {segment} ・タグ {tags}",
         "phase": {
+          "compressing": "圧縮中",
           "preparing": "準備中",
           "thinking": "思考中",
           "tool_running": "ツール実行中",
@@ -154,6 +156,7 @@
           "error": "エラー"
         },
         "phaseShort": {
+          "compressing": "圧縮",
           "preparing": "準備",
           "thinking": "思考",
           "tool_running": "ツール",
diff --git a/src/i18n/locales/zh-CN/ai.json b/src/i18n/locales/zh-CN/ai.json
index 7d2d518b..382aacfe 100644
--- a/src/i18n/locales/zh-CN/ai.json
+++ b/src/i18n/locales/zh-CN/ai.json
@@ -120,7 +120,8 @@
     "thinking": {
       "processingResult": "处理结果中",
       "called": "已调用:",
-      "analyzing": "正在分析问题..."
+      "analyzing": "正在分析问题...",
+      "compressing": "正在压缩上下文..."
     },
     "statusBar": {
       "preset": {
@@ -145,6 +146,7 @@
         "contextTokens": "上下文",
         "stats": "段 {segment} · 标签 {tags}",
         "phase": {
+          "compressing": "压缩上下文",
           "preparing": "准备中",
           "thinking": "思考中",
           "tool_running": "调用工具",
@@ -154,6 +156,7 @@
           "error": "错误"
         },
         "phaseShort": {
+          "compressing": "压缩",
           "preparing": "准备",
           "thinking": "思考",
           "tool_running": "工具",
diff --git a/src/i18n/locales/zh-TW/ai.json b/src/i18n/locales/zh-TW/ai.json
index 73ee7378..deb27be0 100644
--- a/src/i18n/locales/zh-TW/ai.json
+++ b/src/i18n/locales/zh-TW/ai.json
@@ -120,7 +120,8 @@
     "thinking": {
       "processingResult": "正在整理結果",
       "called": "已執行：",
-      "analyzing": "正在分析問題..."
+      "analyzing": "正在分析問題...",
+      "compressing": "正在壓縮上下文..."
     },
     "statusBar": {
       "preset": {
@@ -145,6 +146,7 @@
         "contextTokens": "上下文",
         "stats": "段 {segment} · 標籤 {tags}",
         "phase": {
+          "compressing": "壓縮上下文",
           "preparing": "準備中",
           "thinking": "思考中",
           "tool_running": "工具執行中",
@@ -154,6 +156,7 @@
           "error": "錯誤"
         },
         "phaseShort": {
+          "compressing": "壓縮",
           "preparing": "準備",
           "thinking": "思考",
           "tool_running": "工具",
diff --git a/src/stores/aiChat.ts b/src/stores/aiChat.ts
index 56416851..bc63c343 100644
--- a/src/stores/aiChat.ts
+++ b/src/stores/aiChat.ts
@@ -54,7 +54,7 @@ export type ContentBlock =
 // 消息类型
 export interface ChatMessage {
   id: string
-  role: 'user' | 'assistant' | 'summary'
+  role: 'user' | 'assistant' | 'system'
   content: string
   timestamp: number
   dataSource?: {
@@ -658,7 +658,7 @@ export const useAIChatStore = defineStore('aiChatRuntime', () => {
         })
       }
       targetBuffer.messages.push(aiMessage)
-      const aiMessageIndex = targetBuffer.messages.length - 1
+      let aiMessageIndex = targetBuffer.messages.length - 1
       let hasStreamError = false
 
       const updateAIMessage = (updates: Partial<ChatMessage>) => {
@@ -863,6 +863,20 @@ export const useAIChatStore = defineStore('aiChatRuntime', () => {
               }
               break
 
+            case 'compression_done':
+              if (chunk.compressionResult) {
+                const systemMsg: ChatMessage = {
+                  id: `system-${Date.now()}`,
+                  role: 'system',
+                  content: chunk.compressionResult.summaryContent,
+                  timestamp: chunk.compressionResult.timestamp,
+                }
+                const insertIdx = Math.max(0, targetBuffer.messages.length - 1)
+                targetBuffer.messages.splice(insertIdx, 0, systemMsg)
+                aiMessageIndex++
+              }
+              break
+
             case 'done':
               state.currentToolStatus = null
               if (chunk.usage) {