feat(core): Migrate generateContent to model configs. (#12834)

This commit is contained in:
joshualitt
2025-11-11 08:10:50 -08:00
committed by GitHub
parent cbbf565121
commit a4415f15d3
15 changed files with 169 additions and 95 deletions
+46 -9
View File
@@ -14,6 +14,11 @@ import {
defaultSummarizer,
} from './summarizer.js';
import type { ToolResult } from '../tools/tools.js';
import type {
ModelConfigService,
ResolvedModelConfig,
} from '../services/modelConfigService.js';
import { DEFAULT_GEMINI_MODEL } from '../config/models.js';
// Mock GeminiClient and Config constructor
vi.mock('../core/client.js');
@@ -22,11 +27,18 @@ vi.mock('../config/config.js');
describe('summarizers', () => {
let mockGeminiClient: GeminiClient;
let MockConfig: Mock;
let mockConfigInstance: Config;
const abortSignal = new AbortController().signal;
const mockResolvedConfig = {
model: 'gemini-pro',
generateContentConfig: {
maxOutputTokens: 2000,
},
} as unknown as ResolvedModelConfig;
beforeEach(() => {
MockConfig = vi.mocked(Config);
const mockConfigInstance = new MockConfig(
mockConfigInstance = new MockConfig(
'test-api-key',
'gemini-pro',
false,
@@ -38,6 +50,9 @@ describe('summarizers', () => {
undefined,
undefined,
);
(mockConfigInstance.modelConfigService as unknown) = {
getResolvedConfig: vi.fn().mockReturnValue(mockResolvedConfig),
} as unknown as ModelConfigService;
mockGeminiClient = new GeminiClient(mockConfigInstance);
(mockGeminiClient.generateContent as Mock) = vi.fn();
@@ -54,10 +69,11 @@ describe('summarizers', () => {
it('should return original text if it is shorter than maxLength', async () => {
const shortText = 'This is a short text.';
const result = await summarizeToolOutput(
mockConfigInstance,
{ model: DEFAULT_GEMINI_MODEL },
shortText,
mockGeminiClient,
abortSignal,
2000,
);
expect(result).toBe(shortText);
expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();
@@ -66,10 +82,11 @@ describe('summarizers', () => {
it('should return original text if it is empty', async () => {
const emptyText = '';
const result = await summarizeToolOutput(
mockConfigInstance,
{ model: DEFAULT_GEMINI_MODEL },
emptyText,
mockGeminiClient,
abortSignal,
2000,
);
expect(result).toBe(emptyText);
expect(mockGeminiClient.generateContent).not.toHaveBeenCalled();
@@ -81,12 +98,12 @@ describe('summarizers', () => {
(mockGeminiClient.generateContent as Mock).mockResolvedValue({
candidates: [{ content: { parts: [{ text: summary }] } }],
});
const result = await summarizeToolOutput(
mockConfigInstance,
{ model: DEFAULT_GEMINI_MODEL },
longText,
mockGeminiClient,
abortSignal,
2000,
);
expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);
@@ -99,10 +116,11 @@ describe('summarizers', () => {
(mockGeminiClient.generateContent as Mock).mockRejectedValue(error);
const result = await summarizeToolOutput(
mockConfigInstance,
{ model: DEFAULT_GEMINI_MODEL },
longText,
mockGeminiClient,
abortSignal,
2000,
);
expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);
@@ -115,8 +133,24 @@ describe('summarizers', () => {
(mockGeminiClient.generateContent as Mock).mockResolvedValue({
candidates: [{ content: { parts: [{ text: summary }] } }],
});
(mockConfigInstance.modelConfigService as unknown) = {
getResolvedConfig() {
return {
model: 'gemini-pro-limited',
generateContentConfig: {
maxOutputTokens: 1000,
},
};
},
};
await summarizeToolOutput(longText, mockGeminiClient, abortSignal, 1000);
await summarizeToolOutput(
mockConfigInstance,
{ model: 'gemini-pro-limited' },
longText,
mockGeminiClient,
abortSignal,
);
const expectedPrompt = `Summarize the following tool output to be a maximum of 1000 tokens. The summary should be concise and capture the main points of the tool output.
@@ -133,7 +167,7 @@ Return the summary string which should first contain an overall summarization of
`;
const calledWith = (mockGeminiClient.generateContent as Mock).mock
.calls[0];
const contents = calledWith[0];
const contents = calledWith[1];
expect(contents[0].parts[0].text).toBe(expectedPrompt);
});
});
@@ -150,6 +184,7 @@ Return the summary string which should first contain an overall summarization of
});
const result = await llmSummarizer(
mockConfigInstance,
toolResult,
mockGeminiClient,
abortSignal,
@@ -171,6 +206,7 @@ Return the summary string which should first contain an overall summarization of
});
const result = await llmSummarizer(
mockConfigInstance,
toolResult,
mockGeminiClient,
abortSignal,
@@ -179,7 +215,7 @@ Return the summary string which should first contain an overall summarization of
expect(mockGeminiClient.generateContent).toHaveBeenCalledTimes(1);
const calledWith = (mockGeminiClient.generateContent as Mock).mock
.calls[0];
const contents = calledWith[0];
const contents = calledWith[1];
expect(contents[0].parts[0].text).toContain(`"${longText}"`);
expect(result).toBe(summary);
});
@@ -193,6 +229,7 @@ Return the summary string which should first contain an overall summarization of
};
const result = await defaultSummarizer(
mockConfigInstance,
toolResult,
mockGeminiClient,
abortSignal,
+21 -15
View File
@@ -5,15 +5,12 @@
*/
import type { ToolResult } from '../tools/tools.js';
import type {
Content,
GenerateContentConfig,
GenerateContentResponse,
} from '@google/genai';
import type { Content } from '@google/genai';
import type { GeminiClient } from '../core/client.js';
import { DEFAULT_GEMINI_FLASH_LITE_MODEL } from '../config/models.js';
import { getResponseText, partToString } from './partUtils.js';
import { debugLogger } from './debugLogger.js';
import type { ModelConfigKey } from '../services/modelConfigService.js';
import type { Config } from '../config/config.js';
/**
* A function that summarizes the result of a tool execution.
@@ -22,6 +19,7 @@ import { debugLogger } from './debugLogger.js';
* @returns The summary of the result.
*/
export type Summarizer = (
config: Config,
result: ToolResult,
geminiClient: GeminiClient,
abortSignal: AbortSignal,
@@ -36,6 +34,7 @@ export type Summarizer = (
* @returns The summary of the result.
*/
export const defaultSummarizer: Summarizer = (
_config: Config,
result: ToolResult,
_geminiClient: GeminiClient,
_abortSignal: AbortSignal,
@@ -55,19 +54,30 @@ Text to summarize:
Return the summary string which should first contain an overall summarization of text followed by the full stack trace of errors and warnings in the tool output.
`;
export const llmSummarizer: Summarizer = (result, geminiClient, abortSignal) =>
export const llmSummarizer: Summarizer = async (
config,
result,
geminiClient,
abortSignal,
) =>
summarizeToolOutput(
config,
{ model: 'summarizer-default' },
partToString(result.llmContent),
geminiClient,
abortSignal,
);
export async function summarizeToolOutput(
config: Config,
modelConfigKey: ModelConfigKey,
textToSummarize: string,
geminiClient: GeminiClient,
abortSignal: AbortSignal,
maxOutputTokens: number = 2000,
): Promise<string> {
const maxOutputTokens =
config.modelConfigService.getResolvedConfig(modelConfigKey)
.generateContentConfig.maxOutputTokens ?? 2000;
// There is going to be a slight difference here since we are comparing length of string with maxOutputTokens.
// This is meant to be a ballpark estimation of if we need to summarize the tool output.
if (!textToSummarize || textToSummarize.length < maxOutputTokens) {
@@ -79,16 +89,12 @@ export async function summarizeToolOutput(
).replace('{textToSummarize}', textToSummarize);
const contents: Content[] = [{ role: 'user', parts: [{ text: prompt }] }];
const toolOutputSummarizerConfig: GenerateContentConfig = {
maxOutputTokens,
};
try {
const parsedResponse = (await geminiClient.generateContent(
const parsedResponse = await geminiClient.generateContent(
modelConfigKey,
contents,
toolOutputSummarizerConfig,
abortSignal,
DEFAULT_GEMINI_FLASH_LITE_MODEL,
)) as unknown as GenerateContentResponse;
);
return getResponseText(parsedResponse) || textToSummarize;
} catch (error) {
debugLogger.warn('Failed to summarize tool output.', error);