packages/core/src/utils/summarizer.test.ts

/**
 * @license
 * Copyright 2025 Google LLC
 * SPDX-License-Identifier: Apache-2.0
 */

import type { Mock } from 'vitest';
import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
import { GeminiClient } from '../core/client.js';
import { Config } from '../config/config.js';
import {
  summarizeToolOutput,
  llmSummarizer,
  defaultSummarizer,
} from './summarizer.js';
import type { ToolResult } from '../tools/tools.js';
import type {
  ModelConfigService,
  ResolvedModelConfig,
} from '../services/modelConfigService.js';
import { DEFAULT_GEMINI_MODEL } from '../config/models.js';
import { debugLogger } from './debugLogger.js';

// Mock GeminiClient and Config constructor
vi.mock('../core/client.js');
vi.mock('../config/config.js');

describe('summarizers', () => {
  let mockGeminiClient: GeminiClient;
  let MockConfig: Mock;
  let mockConfigInstance: Config;
  const abortSignal = new AbortController().signal;
  const mockResolvedConfig = {
    model: 'gemini-pro',
    generateContentConfig: {
      maxOutputTokens: 2000,
    },
  } as unknown as ResolvedModelConfig;

  beforeEach(() => {
    MockConfig = vi.mocked(Config);
    mockConfigInstance = new MockConfig(
      'test-api-key',
      'gemini-pro',
      false,
      '.',
      false,
      undefined,
      false,
      undefined,
      undefined,
      undefined,
    );
    (mockConfigInstance.modelConfigService as unknown) = {
      getResolvedConfig: vi.fn().mockReturnValue(mockResolvedConfig),
    } as unknown as ModelConfigService;

    mockGeminiClient = new GeminiClient(mockConfigInstance);
    (mockGeminiClient.generateContent as Mock) = vi.fn();

    vi.spyOn(console, 'error').mockImplementation(() => {});
    vi.spyOn(debugLogger, 'warn').mockImplementation(() => {});
  });

  afterEach(() => {
    vi.restoreAllMocks();
  });

  describe('summarizeToolOutput', () => {
    it('should return original text if it is shorter than maxLength', async () => {
      const shortText = 'This is a short text.';
      const result = await summarizeToolOutput(
        mockConfigInstance,
        { model: DEFAULT_GEMINI_MODEL },
        shortText,
        mockGeminiClient,
        abortSignal,
      );
      expect(result).toBe(shortText);
      expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();
    });

    it('should return original text if it is empty', async () => {
      const emptyText = '';
      const result = await summarizeToolOutput(
        mockConfigInstance,
        { model: DEFAULT_GEMINI_MODEL },
        emptyText,
        mockGeminiClient,
        abortSignal,
      );
      expect(result).toBe(emptyText);
      expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();
    });

    it('should call generateContent if text is longer than maxLength', async () => {
      const longText = 'This is a very long text.'.repeat(200);
      const summary = 'This is a summary.';
      (mockGeminiClient.generateContent as Mock).mockResolvedValue({
        candidates: [{ content: { parts: [{ text: summary }] } }],
      });
      const result = await summarizeToolOutput(
        mockConfigInstance,
        { model: DEFAULT_GEMINI_MODEL },
        longText,
        mockGeminiClient,
        abortSignal,
      );

      expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);
      expect(result).toBe(summary);
    });

    it('should return original text if generateContent throws an error', async () => {
      const longText = 'This is a very long text.'.repeat(200);
      const error = new Error('API Error');
      (mockGeminiClient.generateContent as Mock).mockRejectedValue(error);

      const result = await summarizeToolOutput(
        mockConfigInstance,
        { model: DEFAULT_GEMINI_MODEL },
        longText,
        mockGeminiClient,
        abortSignal,
      );

      expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);
      expect(result).toBe(longText);
    });

    it('should construct the correct prompt for summarization', async () => {
      const longText = 'This is a very long text.'.repeat(200);
      const summary = 'This is a summary.';
      (mockGeminiClient.generateContent as Mock).mockResolvedValue({
        candidates: [{ content: { parts: [{ text: summary }] } }],
      });
      (mockConfigInstance.modelConfigService as unknown) = {
        getResolvedConfig() {
          return {
            model: 'gemini-pro-limited',
            generateContentConfig: {
              maxOutputTokens: 1000,
            },
          };
        },
      };

      await summarizeToolOutput(
        mockConfigInstance,
        { model: 'gemini-pro-limited' },
        longText,
        mockGeminiClient,
        abortSignal,
      );

      const expectedPrompt = `Summarize the following tool output to be a maximum of 1000 tokens. The summary should be concise and capture the main points of the tool output.

The summarization should be done based on the content that is provided. Here are the basic rules to follow:
1. If the text is a directory listing or any output that is structural, use the history of the conversation to understand the context. Using this context try to understand what information we need from the tool output and return that as a response.
2. If the text is text content and there is nothing structural that we need, summarize the text.
3. If the text is the output of a shell command, use the history of the conversation to understand the context. Using this context try to understand what information we need from the tool output and return a summarization along with the stack trace of any error within the <error></error> tags. The stack trace should be complete and not truncated. If there are warnings, you should include them in the summary within <warning></warning> tags.


Text to summarize:
"${longText}"

Return the summary string which should first contain an overall summarization of text followed by the full stack trace of errors and warnings in the tool output.
`;
      const calledWith = (mockGeminiClient.generateContent as Mock).mock
        .calls[0];
      const contents = calledWith[1];
      expect(contents[0].parts[0].text).toBe(expectedPrompt);
    });
  });

  describe('llmSummarizer', () => {
    it('should summarize tool output using summarizeToolOutput', async () => {
      const toolResult: ToolResult = {
        llmContent: 'This is a very long text.'.repeat(200),
        returnDisplay: '',
      };
      const summary = 'This is a summary.';
      (mockGeminiClient.generateContent as Mock).mockResolvedValue({
        candidates: [{ content: { parts: [{ text: summary }] } }],
      });

      const result = await llmSummarizer(
        mockConfigInstance,
        toolResult,
        mockGeminiClient,
        abortSignal,
      );

      expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);
      expect(result).toBe(summary);
    });

    it('should handle different llmContent types', async () => {
      const longText = 'This is a very long text.'.repeat(200);
      const toolResult: ToolResult = {
        llmContent: [{ text: longText }],
        returnDisplay: '',
      };
      const summary = 'This is a summary.';
      (mockGeminiClient.generateContent as Mock).mockResolvedValue({
        candidates: [{ content: { parts: [{ text: summary }] } }],
      });

      const result = await llmSummarizer(
        mockConfigInstance,
        toolResult,
        mockGeminiClient,
        abortSignal,
      );

      expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);
      const calledWith = (mockGeminiClient.generateContent as Mock).mock
        .calls[0];
      const contents = calledWith[1];
      expect(contents[0].parts[0].text).toContain(`"${longText}"`);
      expect(result).toBe(summary);
    });
  });

  describe('defaultSummarizer', () => {
    it('should stringify the llmContent', async () => {
      const toolResult: ToolResult = {
        llmContent: { text: 'some data' },
        returnDisplay: '',
      };

      const result = await defaultSummarizer(
        mockConfigInstance,
        toolResult,
        mockGeminiClient,
        abortSignal,
      );

      expect(result).toBe(JSON.stringify({ text: 'some data' }));
      expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();
    });
  });
});
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`/**`
			`* @license`
			`* Copyright 2025 Google LLC`
			`* SPDX-License-Identifier: Apache-2.0`
			`*/`

Explict imports & exports with `type` modifier (#3774) 2025-08-26 00:04:53 +02:00			`import type { Mock } from 'vitest';`
			`import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`import { GeminiClient } from '../core/client.js';`
			`import { Config } from '../config/config.js';`
			`import {`
			`summarizeToolOutput,`
			`llmSummarizer,`
			`defaultSummarizer,`
			`} from './summarizer.js';`
Explict imports & exports with `type` modifier (#3774) 2025-08-26 00:04:53 +02:00			`import type { ToolResult } from '../tools/tools.js';`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`import type {`
			`ModelConfigService,`
			`ResolvedModelConfig,`
			`} from '../services/modelConfigService.js';`
			`import { DEFAULT_GEMINI_MODEL } from '../config/models.js';`
Migrate console to coreEvents.emitFeedback or debugLogger (#15219) 2025-12-29 15:46:10 -05:00			`import { debugLogger } from './debugLogger.js';`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00
			`// Mock GeminiClient and Config constructor`
			`vi.mock('../core/client.js');`
			`vi.mock('../config/config.js');`

			`describe('summarizers', () => {`
			`let mockGeminiClient: GeminiClient;`
			`let MockConfig: Mock;`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`let mockConfigInstance: Config;`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`const abortSignal = new AbortController().signal;`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`const mockResolvedConfig = {`
			`model: 'gemini-pro',`
			`generateContentConfig: {`
			`maxOutputTokens: 2000,`
			`},`
			`} as unknown as ResolvedModelConfig;`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00
			`beforeEach(() => {`
			`MockConfig = vi.mocked(Config);`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance = new MockConfig(`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`'test-api-key',`
			`'gemini-pro',`
			`false,`
			`'.',`
			`false,`
			`undefined,`
			`false,`
			`undefined,`
			`undefined,`
			`undefined,`
			`);`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`(mockConfigInstance.modelConfigService as unknown) = {`
			`getResolvedConfig: vi.fn().mockReturnValue(mockResolvedConfig),`
			`} as unknown as ModelConfigService;`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00
			`mockGeminiClient = new GeminiClient(mockConfigInstance);`
			`(mockGeminiClient.generateContent as Mock) = vi.fn();`

			`vi.spyOn(console, 'error').mockImplementation(() => {});`
Migrate console to coreEvents.emitFeedback or debugLogger (#15219) 2025-12-29 15:46:10 -05:00			`vi.spyOn(debugLogger, 'warn').mockImplementation(() => {});`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`});`

			`afterEach(() => {`
Migrate console to coreEvents.emitFeedback or debugLogger (#15219) 2025-12-29 15:46:10 -05:00			`vi.restoreAllMocks();`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`});`

			`describe('summarizeToolOutput', () => {`
			`it('should return original text if it is shorter than maxLength', async () => {`
			`const shortText = 'This is a short text.';`
			`const result = await summarizeToolOutput(`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance,`
			`{ model: DEFAULT_GEMINI_MODEL },`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`shortText,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`
			`expect(result).toBe(shortText);`
			`expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();`
			`});`

			`it('should return original text if it is empty', async () => {`
			`const emptyText = '';`
			`const result = await summarizeToolOutput(`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance,`
			`{ model: DEFAULT_GEMINI_MODEL },`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`emptyText,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`
			`expect(result).toBe(emptyText);`
			`expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();`
			`});`

			`it('should call generateContent if text is longer than maxLength', async () => {`
			`const longText = 'This is a very long text.'.repeat(200);`
			`const summary = 'This is a summary.';`
			`(mockGeminiClient.generateContent as Mock).mockResolvedValue({`
			`candidates: [{ content: { parts: [{ text: summary }] } }],`
			`});`
			`const result = await summarizeToolOutput(`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance,`
			`{ model: DEFAULT_GEMINI_MODEL },`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`longText,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`

			`expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);`
			`expect(result).toBe(summary);`
			`});`

			`it('should return original text if generateContent throws an error', async () => {`
			`const longText = 'This is a very long text.'.repeat(200);`
			`const error = new Error('API Error');`
			`(mockGeminiClient.generateContent as Mock).mockRejectedValue(error);`

			`const result = await summarizeToolOutput(`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance,`
			`{ model: DEFAULT_GEMINI_MODEL },`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`longText,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`

			`expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);`
			`expect(result).toBe(longText);`
			`});`

			`it('should construct the correct prompt for summarization', async () => {`
			`const longText = 'This is a very long text.'.repeat(200);`
			`const summary = 'This is a summary.';`
			`(mockGeminiClient.generateContent as Mock).mockResolvedValue({`
			`candidates: [{ content: { parts: [{ text: summary }] } }],`
			`});`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`(mockConfigInstance.modelConfigService as unknown) = {`
			`getResolvedConfig() {`
			`return {`
			`model: 'gemini-pro-limited',`
			`generateContentConfig: {`
			`maxOutputTokens: 1000,`
			`},`
			`};`
			`},`
			`};`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`await summarizeToolOutput(`
			`mockConfigInstance,`
			`{ model: 'gemini-pro-limited' },`
			`longText,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00
Enable tool summarization only when explicitly set in settings.json (#4140) Co-authored-by: matt korwel <matt.korwel@gmail.com> 2025-07-15 10:22:31 -07:00			const expectedPrompt = `Summarize the following tool output to be a maximum of 1000 tokens. The summary should be concise and capture the main points of the tool output.
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00
			`The summarization should be done based on the content that is provided. Here are the basic rules to follow:`
			`1. If the text is a directory listing or any output that is structural, use the history of the conversation to understand the context. Using this context try to understand what information we need from the tool output and return that as a response.`
			`2. If the text is text content and there is nothing structural that we need, summarize the text.`
			`3. If the text is the output of a shell command, use the history of the conversation to understand the context. Using this context try to understand what information we need from the tool output and return a summarization along with the stack trace of any error within the <error></error> tags. The stack trace should be complete and not truncated. If there are warnings, you should include them in the summary within <warning></warning> tags.`


			`Text to summarize:`
			`"${longText}"`

			`Return the summary string which should first contain an overall summarization of text followed by the full stack trace of errors and warnings in the tool output.`
			`;
			`const calledWith = (mockGeminiClient.generateContent as Mock).mock`
			`.calls[0];`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`const contents = calledWith[1];`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`expect(contents[0].parts[0].text).toBe(expectedPrompt);`
			`});`
			`});`

			`describe('llmSummarizer', () => {`
			`it('should summarize tool output using summarizeToolOutput', async () => {`
			`const toolResult: ToolResult = {`
			`llmContent: 'This is a very long text.'.repeat(200),`
			`returnDisplay: '',`
			`};`
			`const summary = 'This is a summary.';`
			`(mockGeminiClient.generateContent as Mock).mockResolvedValue({`
			`candidates: [{ content: { parts: [{ text: summary }] } }],`
			`});`

			`const result = await llmSummarizer(`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance,`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`toolResult,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`

			`expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);`
			`expect(result).toBe(summary);`
			`});`

			`it('should handle different llmContent types', async () => {`
			`const longText = 'This is a very long text.'.repeat(200);`
			`const toolResult: ToolResult = {`
			`llmContent: [{ text: longText }],`
			`returnDisplay: '',`
			`};`
			`const summary = 'This is a summary.';`
			`(mockGeminiClient.generateContent as Mock).mockResolvedValue({`
			`candidates: [{ content: { parts: [{ text: summary }] } }],`
			`});`

			`const result = await llmSummarizer(`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance,`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`toolResult,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`

			`expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);`
			`const calledWith = (mockGeminiClient.generateContent as Mock).mock`
			`.calls[0];`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`const contents = calledWith[1];`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			expect(contents[0].parts[0].text).toContain(`"${longText}"`);
			`expect(result).toBe(summary);`
			`});`
			`});`

			`describe('defaultSummarizer', () => {`
			`it('should stringify the llmContent', async () => {`
			`const toolResult: ToolResult = {`
			`llmContent: { text: 'some data' },`
			`returnDisplay: '',`
			`};`

			`const result = await defaultSummarizer(`
feat(core): Migrate `generateContent` to model configs. (#12834) 2025-11-11 08:10:50 -08:00			`mockConfigInstance,`
Summarize tool call outputs using tool specific summarizers (#3745) 2025-07-11 09:29:08 -07:00			`toolResult,`
			`mockGeminiClient,`
			`abortSignal,`
			`);`

			`expect(result).toBe(JSON.stringify({ text: 'some data' }));`
			`expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();`
			`});`
			`});`
			`});`