fix(web-fetch): respect Content-Type header in fallback mechanism (#11284)

2026-05-03 08:24:10 -07:00 · 2025-10-16 14:16:24 -04:00
parent ffa547ce8d
commit 05930d5e25
2 changed files with 138 additions and 8 deletions
@@ -22,12 +22,17 @@ import {
  logWebFetchFallbackAttempt,
  WebFetchFallbackAttemptEvent,
 } from '../telemetry/index.js';
+import { convert } from 'html-to-text';

 const mockGenerateContent = vi.fn();
 const mockGetGeminiClient = vi.fn(() => ({
  generateContent: mockGenerateContent,
 }));

+vi.mock('html-to-text', () => ({
+  convert: vi.fn((text) => `Converted: ${text}`), // stub: returns the input prefixed with "Converted: " so tests can tell whether conversion ran
+}));
+
 vi.mock('../telemetry/index.js', () => ({
  logWebFetchFallbackAttempt: vi.fn(),
  WebFetchFallbackAttemptEvent: vi.fn(),
@@ -246,6 +251,116 @@ describe('WebFetchTool', () => {
    });
  });

+  describe('execute (fallback)', () => {
+    beforeEach(() => {
+      // Steer execute() onto the fallback path: presumably the empty primary response queued below is what triggers it (confirm against WebFetchTool).
+      vi.spyOn(fetchUtils, 'isPrivateIp').mockReturnValue(false); // URL is reported as non-private
+      mockGenerateContent.mockResolvedValueOnce({
+        candidates: [], // first generateContent call resolves with no candidates
+      });
+    });
+
+    it('should convert HTML content using html-to-text', async () => {
+      const htmlContent = '<html><body><h1>Hello</h1></body></html>';
+      vi.spyOn(fetchUtils, 'fetchWithTimeout').mockResolvedValue({
+        ok: true,
+        headers: new Headers({ 'content-type': 'text/html; charset=utf-8' }),
+        text: () => Promise.resolve(htmlContent),
+      } as Response);
+
+      // Next generateContent call (the fallback LLM request): echo req[0].parts[0].text back so the assertions can inspect the text that was sent
+      mockGenerateContent.mockImplementationOnce(async (req) => ({
+        candidates: [{ content: { parts: [{ text: req[0].parts[0].text }] } }],
+      }));
+
+      const tool = new WebFetchTool(mockConfig);
+      const params = { prompt: 'fetch https://example.com' };
+      const invocation = tool.build(params);
+      const result = await invocation.execute(new AbortController().signal);
+
+      expect(convert).toHaveBeenCalledWith(htmlContent, {
+        wordwrap: false,
+        selectors: [
+          { selector: 'a', options: { ignoreHref: true } },
+          { selector: 'img', format: 'skip' },
+        ],
+      });
+      expect(result.llmContent).toContain(`Converted: ${htmlContent}`); // the mocked convert prefixes its input with "Converted: "
+    });
+
+    it('should return raw text for JSON content', async () => {
+      const jsonContent = '{"key": "value"}';
+      vi.spyOn(fetchUtils, 'fetchWithTimeout').mockResolvedValue({
+        ok: true,
+        headers: new Headers({ 'content-type': 'application/json' }),
+        text: () => Promise.resolve(jsonContent),
+      } as Response);
+
+      // Next generateContent call (the fallback LLM request): echo req[0].parts[0].text back so the assertions can inspect the text that was sent
+      mockGenerateContent.mockImplementationOnce(async (req) => ({
+        candidates: [{ content: { parts: [{ text: req[0].parts[0].text }] } }],
+      }));
+
+      const tool = new WebFetchTool(mockConfig);
+      const params = { prompt: 'fetch https://example.com' };
+      const invocation = tool.build(params);
+      const result = await invocation.execute(new AbortController().signal);
+
+      expect(convert).not.toHaveBeenCalled(); // NOTE(review): assumes the convert mock's call history is cleared between tests — confirm in the outer setup
+      expect(result.llmContent).toContain(jsonContent);
+    });
+
+    it('should return raw text for plain text content', async () => {
+      const textContent = 'Just some text.';
+      vi.spyOn(fetchUtils, 'fetchWithTimeout').mockResolvedValue({
+        ok: true,
+        headers: new Headers({ 'content-type': 'text/plain' }),
+        text: () => Promise.resolve(textContent),
+      } as Response);
+
+      // Next generateContent call (the fallback LLM request): echo req[0].parts[0].text back so the assertions can inspect the text that was sent
+      mockGenerateContent.mockImplementationOnce(async (req) => ({
+        candidates: [{ content: { parts: [{ text: req[0].parts[0].text }] } }],
+      }));
+
+      const tool = new WebFetchTool(mockConfig);
+      const params = { prompt: 'fetch https://example.com' };
+      const invocation = tool.build(params);
+      const result = await invocation.execute(new AbortController().signal);
+
+      expect(convert).not.toHaveBeenCalled(); // NOTE(review): assumes the convert mock's call history is cleared between tests — confirm in the outer setup
+      expect(result.llmContent).toContain(textContent);
+    });
+
+    it('should treat content with no Content-Type header as HTML', async () => {
+      const content = '<p>No header</p>';
+      vi.spyOn(fetchUtils, 'fetchWithTimeout').mockResolvedValue({
+        ok: true,
+        headers: new Headers(), // no content-type header is set on this response
+        text: () => Promise.resolve(content),
+      } as Response);
+
+      // Next generateContent call (the fallback LLM request): echo req[0].parts[0].text back so the assertions can inspect the text that was sent
+      mockGenerateContent.mockImplementationOnce(async (req) => ({
+        candidates: [{ content: { parts: [{ text: req[0].parts[0].text }] } }],
+      }));
+
+      const tool = new WebFetchTool(mockConfig);
+      const params = { prompt: 'fetch https://example.com' };
+      const invocation = tool.build(params);
+      const result = await invocation.execute(new AbortController().signal);
+
+      expect(convert).toHaveBeenCalledWith(content, {
+        wordwrap: false,
+        selectors: [
+          { selector: 'a', options: { ignoreHref: true } },
+          { selector: 'img', format: 'skip' },
+        ],
+      });
+      expect(result.llmContent).toContain(`Converted: ${content}`); // the mocked convert prefixes its input with "Converted: "
+    });
+  });
+
  describe('shouldConfirmExecute', () => {
    it('should return confirmation details with the correct prompt and parsed urls', async () => {
      const tool = new WebFetchTool(mockConfig);
@@ -133,14 +133,29 @@ class WebFetchToolInvocation extends BaseToolInvocation<
          `Request failed with status code ${response.status} ${response.statusText}`,
        );
      }
-      const html = await response.text();
-      const textContent = convert(html, {
-        wordwrap: false,
-        selectors: [
-          { selector: 'a', options: { ignoreHref: true } },
-          { selector: 'img', format: 'skip' },
-        ],
-      }).substring(0, MAX_CONTENT_LENGTH);
+
+      const rawContent = await response.text();
+      const contentType = response.headers.get('content-type') || '';
+      let textContent: string;
+
+      // Only use html-to-text if content type is HTML, or if no content type is provided (assume HTML)
+      if (
+        contentType.toLowerCase().includes('text/html') ||
+        contentType === ''
+      ) {
+        textContent = convert(rawContent, {
+          wordwrap: false,
+          selectors: [
+            { selector: 'a', options: { ignoreHref: true } },
+            { selector: 'img', format: 'skip' },
+          ],
+        });
+      } else {
+        // For other content types (text/plain, application/json, etc.), use raw text
+        textContent = rawContent;
+      }
+
+      textContent = textContent.substring(0, MAX_CONTENT_LENGTH);

      const geminiClient = this.config.getGeminiClient();
      const fallbackPrompt = `The user requested the following: "${this.params.prompt}".