feat(core): Unified Context Management and Tool Distillation. (#24157)

This commit is contained in:
joshualitt
2026-03-30 15:29:59 -07:00
committed by GitHub
parent 117a2d3844
commit dfba0e91e2
22 changed files with 1717 additions and 314 deletions

View File

@@ -293,6 +293,7 @@ describe('WebFetchTool', () => {
})),
},
isInteractive: () => false,
isAutoDistillationEnabled: vi.fn().mockReturnValue(false),
} as unknown as Config;
});
@@ -1118,5 +1119,40 @@ describe('WebFetchTool', () => {
);
expect(result.error?.type).toBe(ToolErrorType.WEB_FETCH_PROCESSING_ERROR);
});
it('should bypass truncation if isAutoDistillationEnabled is true', async () => {
vi.spyOn(mockConfig, 'isAutoDistillationEnabled').mockReturnValue(true);
const largeContent = 'a'.repeat(300000); // Larger than MAX_CONTENT_LENGTH (250000)
mockFetch('https://example.com/large-text', {
status: 200,
headers: new Headers({ 'content-type': 'text/plain' }),
text: () => Promise.resolve(largeContent),
});
const tool = new WebFetchTool(mockConfig, bus);
const invocation = tool.build({ url: 'https://example.com/large-text' });
const result = await invocation.execute(new AbortController().signal);
expect((result.llmContent as string).length).toBe(300000); // No truncation
});
it('should truncate if isAutoDistillationEnabled is false', async () => {
vi.spyOn(mockConfig, 'isAutoDistillationEnabled').mockReturnValue(false);
const largeContent = 'a'.repeat(300000); // Larger than MAX_CONTENT_LENGTH (250000)
mockFetch('https://example.com/large-text2', {
status: 200,
headers: new Headers({ 'content-type': 'text/plain' }),
text: () => Promise.resolve(largeContent),
});
const tool = new WebFetchTool(mockConfig, bus);
const invocation = tool.build({ url: 'https://example.com/large-text2' });
const result = await invocation.execute(new AbortController().signal);
expect((result.llmContent as string).length).toBeLessThan(300000);
expect(result.llmContent).toContain(
'[Content truncated due to size limit]',
);
});
});
});

View File

@@ -338,9 +338,15 @@ class WebFetchToolInvocation extends BaseToolInvocation<
textContent = rawContent;
}
// Cap at MAX_CONTENT_LENGTH initially to avoid excessive memory usage
// before the global budget allocation.
return truncateString(textContent, MAX_CONTENT_LENGTH, '');
if (!this.context.config.isAutoDistillationEnabled()) {
return truncateString(
textContent,
MAX_CONTENT_LENGTH,
TRUNCATION_WARNING,
);
}
return textContent;
}
private filterAndValidateUrls(urls: string[]): {
@@ -406,28 +412,32 @@ class WebFetchToolInvocation extends BaseToolInvocation<
};
}
// Smart Budget Allocation (Water-filling algorithm) for successes
const sortedSuccesses = [...successes].sort(
(a, b) => a.content.length - b.content.length,
);
let remainingBudget = MAX_CONTENT_LENGTH;
let remainingUrls = sortedSuccesses.length;
const finalContentsByUrl = new Map<string, string>();
for (const success of sortedSuccesses) {
const fairShare = Math.floor(remainingBudget / remainingUrls);
const allocated = Math.min(success.content.length, fairShare);
const truncated = truncateString(
success.content,
allocated,
TRUNCATION_WARNING,
if (this.context.config.isAutoDistillationEnabled()) {
successes.forEach((success) =>
finalContentsByUrl.set(success.url, success.content),
);
} else {
// Smart Budget Allocation (Water-filling algorithm) for successes
const sortedSuccesses = [...successes].sort(
(a, b) => a.content.length - b.content.length,
);
let remainingBudget = MAX_CONTENT_LENGTH;
let remainingUrls = sortedSuccesses.length;
for (const success of sortedSuccesses) {
const fairShare = Math.floor(remainingBudget / remainingUrls);
const allocated = Math.min(success.content.length, fairShare);
finalContentsByUrl.set(success.url, truncated);
remainingBudget -= truncated.length;
remainingUrls--;
const truncated = truncateString(
success.content,
allocated,
TRUNCATION_WARNING,
);
finalContentsByUrl.set(success.url, truncated);
remainingBudget -= truncated.length;
remainingUrls--;
}
}
const aggregatedContent = uniqueUrls
@@ -648,14 +658,21 @@ ${aggregatedContent}
);
if (status >= 400) {
const rawResponseText = bodyBuffer.toString('utf8');
let rawResponseText = bodyBuffer.toString('utf8');
if (!this.context.config.isAutoDistillationEnabled()) {
rawResponseText = truncateString(
rawResponseText,
10000,
'\n\n... [Error response truncated] ...',
);
}
const headers: Record<string, string> = {};
response.headers.forEach((value, key) => {
headers[key] = value;
});
const errorContent = `Request failed with status ${status}
Headers: ${JSON.stringify(headers, null, 2)}
Response: ${truncateString(rawResponseText, 10000, '\n\n... [Error response truncated] ...')}`;
Response: ${rawResponseText}`;
debugLogger.error(
`[WebFetchTool] Experimental fetch failed with status ${status} for ${url}`,
);
@@ -671,11 +688,10 @@ Response: ${truncateString(rawResponseText, 10000, '\n\n... [Error response trun
lowContentType.includes('text/plain') ||
lowContentType.includes('application/json')
) {
const text = truncateString(
bodyBuffer.toString('utf8'),
MAX_CONTENT_LENGTH,
TRUNCATION_WARNING,
);
let text = bodyBuffer.toString('utf8');
if (!this.context.config.isAutoDistillationEnabled()) {
text = truncateString(text, MAX_CONTENT_LENGTH, TRUNCATION_WARNING);
}
return {
llmContent: text,
returnDisplay: `Fetched ${contentType} content from ${url}`,
@@ -684,16 +700,19 @@ Response: ${truncateString(rawResponseText, 10000, '\n\n... [Error response trun
if (lowContentType.includes('text/html')) {
const html = bodyBuffer.toString('utf8');
const textContent = truncateString(
convert(html, {
wordwrap: false,
selectors: [
{ selector: 'a', options: { ignoreHref: false, baseUrl: url } },
],
}),
MAX_CONTENT_LENGTH,
TRUNCATION_WARNING,
);
let textContent = convert(html, {
wordwrap: false,
selectors: [
{ selector: 'a', options: { ignoreHref: false, baseUrl: url } },
],
});
if (!this.context.config.isAutoDistillationEnabled()) {
textContent = truncateString(
textContent,
MAX_CONTENT_LENGTH,
TRUNCATION_WARNING,
);
}
return {
llmContent: textContent,
returnDisplay: `Fetched and converted HTML content from ${url}`,
@@ -718,11 +737,10 @@ Response: ${truncateString(rawResponseText, 10000, '\n\n... [Error response trun
}
// Fallback for unknown types - try as text
const text = truncateString(
bodyBuffer.toString('utf8'),
MAX_CONTENT_LENGTH,
TRUNCATION_WARNING,
);
let text = bodyBuffer.toString('utf8');
if (!this.context.config.isAutoDistillationEnabled()) {
text = truncateString(text, MAX_CONTENT_LENGTH, TRUNCATION_WARNING);
}
return {
llmContent: text,
returnDisplay: `Fetched ${contentType || 'unknown'} content from ${url}`,