special handling for summarized thinking

This commit is contained in:
tanzhenxin
2025-12-22 14:07:23 +08:00
parent fefc138485
commit 87d8d82be7
12 changed files with 187 additions and 42 deletions

View File

@@ -4,12 +4,8 @@
* SPDX-License-Identifier: Apache-2.0
*/
import type { Config ,
AuthType} from '@qwen-code/qwen-code-core';
import {
InputFormat,
logUserPrompt,
} from '@qwen-code/qwen-code-core';
import type { Config, AuthType } from '@qwen-code/qwen-code-core';
import { InputFormat, logUserPrompt } from '@qwen-code/qwen-code-core';
import { render } from 'ink';
import dns from 'node:dns';
import os from 'node:os';

View File

@@ -769,11 +769,17 @@ export const useGeminiStream = (
for await (const event of stream) {
switch (event.type) {
case ServerGeminiEventType.Thought:
thoughtBuffer = handleThoughtEvent(
event.value,
thoughtBuffer,
userMessageTimestamp,
);
// If the thought has a subject, it's a discrete status update rather than
// a streamed textual thought, so we update the thought state directly.
if (event.value.subject) {
setThought(event.value);
} else {
thoughtBuffer = handleThoughtEvent(
event.value,
thoughtBuffer,
userMessageTimestamp,
);
}
break;
case ServerGeminiEventType.Content:
geminiMessageBuffer = handleContentEvent(
@@ -844,6 +850,7 @@ export const useGeminiStream = (
handleMaxSessionTurnsEvent,
handleSessionTokenLimitExceededEvent,
handleCitationEvent,
setThought,
],
);

View File

@@ -16,8 +16,8 @@ import { ProxyAgent, setGlobalDispatcher } from 'undici';
import type {
ContentGenerator,
ContentGeneratorConfig,
AuthType} from '../core/contentGenerator.js';
AuthType,
} from '../core/contentGenerator.js';
import type { FallbackModelHandler } from '../fallback/types.js';
import type { MCPOAuthConfig } from '../mcp/oauth-provider.js';
import type { ShellExecutionConfig } from '../services/shellExecutionService.js';

View File

@@ -32,6 +32,8 @@ export interface ContentGenerator {
countTokens(request: CountTokensParameters): Promise<CountTokensResponse>;
embedContent(request: EmbedContentParameters): Promise<EmbedContentResponse>;
useSummarizedThinking(): boolean;
}
export enum AuthType {

View File

@@ -100,6 +100,7 @@ describe('GeminiChat', () => {
countTokens: vi.fn(),
embedContent: vi.fn(),
batchEmbedContents: vi.fn(),
useSummarizedThinking: vi.fn().mockReturnValue(false),
} as unknown as ContentGenerator;
mockHandleFallback.mockClear();
@@ -718,6 +719,99 @@ describe('GeminiChat', () => {
1,
);
});
it('should handle summarized thinking by conditionally including thoughts in history', async () => {
  // Case 1: useSummarizedThinking is true -> thoughts NOT in history
  vi.mocked(mockContentGenerator.useSummarizedThinking).mockReturnValue(
    true,
  );
  const stream1 = (async function* () {
    yield {
      candidates: [
        {
          content: {
            role: 'model',
            parts: [{ thought: true, text: 'T1' }, { text: 'A1' }],
          },
          finishReason: 'STOP',
        },
      ],
    } as unknown as GenerateContentResponse;
  })();
  vi.mocked(mockContentGenerator.generateContentStream).mockResolvedValue(
    stream1,
  );
  const res1 = await chat.sendMessageStream('m1', { message: 'h1' }, 'p1');
  // Drain the stream fully so history consolidation runs.
  for await (const _ of res1);
  const history1 = chat.getHistory();
  // Thought part 'T1' must be dropped; only the answer text remains.
  expect(history1[1].parts).toEqual([{ text: 'A1' }]);
  // Case 2: useSummarizedThinking is false -> thoughts ARE in history
  chat.clearHistory();
  vi.mocked(mockContentGenerator.useSummarizedThinking).mockReturnValue(
    false,
  );
  const stream2 = (async function* () {
    yield {
      candidates: [
        {
          content: {
            role: 'model',
            parts: [{ thought: true, text: 'T2' }, { text: 'A2' }],
          },
          finishReason: 'STOP',
        },
      ],
    } as unknown as GenerateContentResponse;
  })();
  vi.mocked(mockContentGenerator.generateContentStream).mockResolvedValue(
    stream2,
  );
  const res2 = await chat.sendMessageStream('m1', { message: 'h1' }, 'p2');
  for await (const _ of res2);
  const history2 = chat.getHistory();
  // Thought part is preserved alongside the answer in recorded history.
  expect(history2[1].parts).toEqual([
    { text: 'T2', thought: true },
    { text: 'A2' },
  ]);
});
it('should keep parts with thoughtSignature when consolidating history', async () => {
  // A single model part that is NOT a thought but carries a
  // thoughtSignature; consolidation must not discard it as "empty".
  const stream = (async function* () {
    yield {
      candidates: [
        {
          content: {
            role: 'model',
            parts: [
              {
                text: 'p1',
                thoughtSignature: 's1',
              } as unknown as { text: string; thoughtSignature: string },
            ],
          },
          finishReason: 'STOP',
        },
      ],
    } as unknown as GenerateContentResponse;
  })();
  vi.mocked(mockContentGenerator.generateContentStream).mockResolvedValue(
    stream,
  );
  const res = await chat.sendMessageStream('m1', { message: 'h1' }, 'p1');
  // Drain the stream fully so history consolidation runs.
  for await (const _ of res);
  const history = chat.getHistory();
  // Both the text and its signature survive consolidation unchanged.
  expect(history[1].parts![0]).toEqual({
    text: 'p1',
    thoughtSignature: 's1',
  });
});
});
describe('addHistory', () => {
@@ -1532,7 +1626,7 @@ describe('GeminiChat', () => {
});
describe('stripThoughtsFromHistory', () => {
it('should strip thought signatures', () => {
it('should strip thoughts and thought signatures, and remove empty content objects', () => {
chat.setHistory([
{
role: 'user',
@@ -1544,10 +1638,15 @@ describe('GeminiChat', () => {
{ text: 'thinking...', thought: true },
{ text: 'hi' },
{
functionCall: { name: 'test', args: {} },
},
text: 'hidden metadata',
thoughtSignature: 'abc',
} as unknown as { text: string; thoughtSignature: string },
],
},
{
role: 'model',
parts: [{ text: 'only thinking', thought: true }],
},
]);
chat.stripThoughtsFromHistory();
@@ -1559,7 +1658,7 @@ describe('GeminiChat', () => {
},
{
role: 'model',
parts: [{ text: 'hi' }, { functionCall: { name: 'test', args: {} } }],
parts: [{ text: 'hi' }, { text: 'hidden metadata' }],
},
]);
});

View File

@@ -109,18 +109,24 @@ function isValidContent(content: Content): boolean {
if (part === undefined || Object.keys(part).length === 0) {
return false;
}
if (
!part.thought &&
part.text !== undefined &&
part.text === '' &&
part.functionCall === undefined
) {
if (!isValidContentPart(part)) {
return false;
}
}
return true;
}
/**
 * Returns whether a content part carries meaningful payload.
 *
 * A part is rejected only when it is a bare empty text part: `text === ''`
 * while it is not a thought, has no `thoughtSignature`, and holds no
 * `functionCall`. Thought parts and signature-bearing parts are always
 * kept, even when their text is empty.
 */
function isValidContentPart(part: Part): boolean {
  // Note: `part.text === ''` already implies `part.text !== undefined`,
  // so no separate definedness check is needed.
  const isEmptyTextOnly =
    part.text === '' &&
    !part.thought &&
    !part.thoughtSignature &&
    part.functionCall === undefined;
  return !isEmptyTextOnly;
}
/**
* Validates the history contains the correct roles.
*
@@ -448,15 +454,29 @@ export class GeminiChat {
if (!content.parts) return content;
// Filter out thought parts entirely
const filteredParts = content.parts.filter(
(part) =>
!(
const filteredParts = content.parts
.filter(
(part) =>
!(
part &&
typeof part === 'object' &&
'thought' in part &&
part.thought
),
)
.map((part) => {
if (
part &&
typeof part === 'object' &&
'thought' in part &&
part.thought
),
);
'thoughtSignature' in part
) {
const newPart = { ...part };
delete (newPart as { thoughtSignature?: string })
.thoughtSignature;
return newPart;
}
return part;
});
return {
...content,
@@ -538,11 +558,15 @@ export class GeminiChat {
yield chunk; // Yield every chunk to the UI immediately.
}
const thoughtParts = allModelParts.filter((part) => part.thought);
const thoughtText = thoughtParts
.map((part) => part.text)
.join('')
.trim();
let thoughtText = '';
// Only include thoughts if not using summarized thinking.
if (!this.config.getContentGenerator().useSummarizedThinking()) {
thoughtText = allModelParts
.filter((part) => part.thought)
.map((part) => part.text)
.join('')
.trim();
}
const contentParts = allModelParts.filter((part) => !part.thought);
const consolidatedHistoryParts: Part[] = [];
@@ -555,7 +579,7 @@ export class GeminiChat {
isValidNonThoughtTextPart(part)
) {
lastPart.text += part.text;
} else {
} else if (isValidContentPart(part)) {
consolidatedHistoryParts.push(part);
}
}

View File

@@ -137,4 +137,8 @@ export class GeminiContentGenerator implements ContentGenerator {
): Promise<EmbedContentResponse> {
return this.googleGenAI.models.embedContent(request);
}
/**
 * Whether this generator emits summarized thinking.
 *
 * Returns true for the Gemini generator: per this commit's GeminiChat
 * change, consumers use this flag to omit thought parts when
 * consolidating model output into history.
 */
useSummarizedThinking(): boolean {
  return true;
}
}

View File

@@ -209,6 +209,10 @@ export class LoggingContentGenerator implements ContentGenerator {
return this.wrapped.embedContent(req);
}
/** Pass-through: reports the wrapped generator's summarized-thinking flag. */
useSummarizedThinking(): boolean {
  return this.wrapped.useSummarizedThinking();
}
private toContents(contents: ContentListUnion): Content[] {
if (Array.isArray(contents)) {
// it's a Content[] or a PartsUnion[]

View File

@@ -154,4 +154,8 @@ export class OpenAIContentGenerator implements ContentGenerator {
);
}
}
/**
 * Whether this generator emits summarized thinking.
 *
 * Returns false for the OpenAI-compatible generator, so (per the
 * GeminiChat change in this commit) thought text IS retained when
 * consolidating model output into history.
 */
useSummarizedThinking(): boolean {
  return false;
}
}

View File

@@ -27,7 +27,11 @@ import {
toFriendlyError,
} from '../utils/errors.js';
import type { GeminiChat } from './geminiChat.js';
import { getThoughtText, type ThoughtSummary } from '../utils/thoughtUtils.js';
import {
getThoughtText,
parseThought,
type ThoughtSummary,
} from '../utils/thoughtUtils.js';
// Define a structure for tools passed to the server
export interface ServerTool {
@@ -266,11 +270,11 @@ export class Turn {
this.currentResponseId = resp.responseId;
}
const thoughtPart = getThoughtText(resp);
if (thoughtPart) {
const thoughtText = getThoughtText(resp);
if (thoughtText) {
yield {
type: GeminiEventType.Thought,
value: { subject: '', description: thoughtPart },
value: parseThought(thoughtText),
};
continue;
}

View File

@@ -61,6 +61,7 @@ describe('checkNextSpeaker', () => {
generateContentStream: vi.fn(),
countTokens: vi.fn(),
embedContent: vi.fn(),
useSummarizedThinking: vi.fn().mockReturnValue(false),
} as ContentGenerator,
{} as Config,
);

View File

@@ -29,7 +29,7 @@ export function parseThought(rawText: string): ThoughtSummary {
const startIndex = rawText.indexOf(START_DELIMITER);
if (startIndex === -1) {
// No start delimiter found, the whole text is the description.
return { subject: '', description: rawText.trim() };
return { subject: '', description: rawText };
}
const endIndex = rawText.indexOf(
@@ -39,7 +39,7 @@ export function parseThought(rawText: string): ThoughtSummary {
if (endIndex === -1) {
// Start delimiter found but no end delimiter, so it's not a valid subject.
// Treat the entire string as the description.
return { subject: '', description: rawText.trim() };
return { subject: '', description: rawText };
}
const subject = rawText