jaworldwideorg
diff --git a/packages/prompts/src/prompts/index.ts b/packages/prompts/src/prompts/index.ts
Lines changed: 1 addition & 0 deletions
diff --git a/packages/prompts/src/prompts/search/crawlResults.test.ts b/packages/prompts/src/prompts/search/crawlResults.test.ts
Lines changed: 172 additions & 0 deletions
diff --git a/packages/prompts/src/prompts/search/crawlResults.ts b/packages/prompts/src/prompts/search/crawlResults.ts
Lines changed: 82 additions & 0 deletions
diff --git a/packages/prompts/src/prompts/search/index.ts b/packages/prompts/src/prompts/search/index.ts
Lines changed: 2 additions & 0 deletions
@@ -2,4 +2,5 @@ export * from './chatMessages';
 export * from './files';
 export * from './knowledgeBaseQA';
 export * from './plugin';
+export * from './search';
 export * from './systemRole';
@@ -0,0 +1,172 @@
+import { describe, expect, it } from 'vitest';
+
+import { crawlResultsPrompt } from './crawlResults';
+
+// Vitest suite for crawlResultsPrompt: every case feeds a small fixture through
+// the formatter and compares the complete XML string it returns.
+describe('crawlResultsPrompt', () => {
+  it('should return empty XML for empty results', () => {
+    const output = crawlResultsPrompt([]);
+
+    expect(output).toBe('<no_crawl_results />');
+  });
+
+  it('should convert basic crawl result to compact XML format', () => {
+    // Minimal page: url + title become attributes, content becomes the body.
+    const input = [
+      {
+        url: 'https://example.com',
+        title: 'Example Page',
+        content: 'Page content here',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <page url="https://example.com" title="Example Page">Page content here</page>
+</crawlResults>`);
+  });
+
+  it('should include all optional metadata fields', () => {
+    // Attributes are expected in the order url, title, contentType, description, length.
+    const input = [
+      {
+        url: 'http://arxiv.org/abs/2509.09734v1',
+        title: 'MCP-AgentBench: Evaluating Real-World Language Agent Performance',
+        contentType: 'text' as const,
+        description: 'Abstract page for arXiv paper 2509.09734v1',
+        length: 10187,
+        content: 'Full paper content...',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <page url="http://arxiv.org/abs/2509.09734v1" title="MCP-AgentBench: Evaluating Real-World Language Agent Performance" contentType="text" description="Abstract page for arXiv paper 2509.09734v1" length="10187">Full paper content...</page>
+</crawlResults>`);
+  });
+
+  it('should handle page without content', () => {
+    // No content => the page collapses to a self-closing element.
+    const input = [
+      {
+        url: 'https://example.com',
+        title: 'Empty Page',
+        contentType: 'text' as const,
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <page url="https://example.com" title="Empty Page" contentType="text" />
+</crawlResults>`);
+  });
+
+  it('should handle error items', () => {
+    const input = [
+      {
+        errorType: 'NetworkError',
+        errorMessage: 'Failed to fetch the page',
+        url: 'https://failed.com',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <error errorType="NetworkError" errorMessage="Failed to fetch the page" url="https://failed.com" />
+</crawlResults>`);
+  });
+
+  it('should escape XML special characters in attributes', () => {
+    // &, <, > and " must all be entity-encoded inside attribute values.
+    const input = [
+      {
+        url: 'https://example.com?foo=bar&baz=qux',
+        title: 'Title with <tags> & "quotes"',
+        description: 'Description with special chars & <html>',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <page url="https://example.com?foo=bar&amp;baz=qux" title="Title with &lt;tags&gt; &amp; &quot;quotes&quot;" description="Description with special chars &amp; &lt;html&gt;" />
+</crawlResults>`);
+  });
+
+  it('should escape XML special characters in content', () => {
+    const input = [
+      {
+        url: 'https://example.com',
+        title: 'Test',
+        content: 'Content with <html> tags & special chars',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <page url="https://example.com" title="Test">Content with &lt;html&gt; tags &amp; special chars</page>
+</crawlResults>`);
+  });
+
+  it('should handle multiple pages with mixed success and errors', () => {
+    // Output order must follow input order: page, error, page.
+    const input = [
+      {
+        url: 'https://success1.com',
+        title: 'First Page',
+        content: 'First content',
+      },
+      {
+        errorType: 'TimeoutError',
+        errorMessage: 'Request timeout',
+        url: 'https://failed.com',
+      },
+      {
+        url: 'https://success2.com',
+        title: 'Second Page',
+        content: 'Second content',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <page url="https://success1.com" title="First Page">First content</page>
+  <error errorType="TimeoutError" errorMessage="Request timeout" url="https://failed.com" />
+  <page url="https://success2.com" title="Second Page">Second content</page>
+</crawlResults>`);
+  });
+
+  it('should handle error without url', () => {
+    const input = [
+      {
+        errorType: 'UnknownError',
+        errorMessage: 'Unknown error occurred',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <error errorType="UnknownError" errorMessage="Unknown error occurred" />
+</crawlResults>`);
+  });
+
+  it('should handle real arXiv example', () => {
+    const input = [
+      {
+        url: 'http://arxiv.org/abs/2508.01780v1',
+        title: 'LiveMCPBench: Can Agents Navigate an Ocean of MCP Tools?',
+        contentType: 'text' as const,
+        description: 'Abstract page for arXiv paper 2508.01780v1',
+        length: 10512,
+        content:
+          'With the rapid development of Model Context Protocol (MCP), the number of MCP servers has surpassed 10,000...',
+      },
+    ];
+
+    const output = crawlResultsPrompt(input);
+
+    expect(output).toBe(`<crawlResults>
+  <page url="http://arxiv.org/abs/2508.01780v1" title="LiveMCPBench: Can Agents Navigate an Ocean of MCP Tools?" contentType="text" description="Abstract page for arXiv paper 2508.01780v1" length="10512">With the rapid development of Model Context Protocol (MCP), the number of MCP servers has surpassed 10,000...</page>
+</crawlResults>`);
+  });
+});
@@ -0,0 +1,82 @@
+import { escapeXmlAttr, escapeXmlContent } from './xmlEscape';
+
+/**
+ * A successfully crawled page as accepted by `crawlResultsPrompt`.
+ * Only `url` is required; every other field is optional.
+ */
+export interface CrawlResultItem {
+  /** Page text; XML-escaped and written as the body of the `<page>` element. */
+  content?: string;
+  /** Written as the `contentType` attribute when set. */
+  contentType?: 'text' | 'json';
+  /** Written as the `description` attribute when non-empty. */
+  description?: string;
+  /**
+   * Written as the `length` attribute when provided.
+   * Presumably the size of the crawled content; confirm against the crawler.
+   */
+  length?: number;
+  /** Declared here, but `crawlResultsPrompt` does not write it to the XML. */
+  siteName?: string;
+  /** Written as the `title` attribute when non-empty. */
+  title?: string;
+  /** Address of the page; always written as the first attribute of `<page>`. */
+  url: string;
+}
+
+/**
+ * A failed crawl attempt as accepted by `crawlResultsPrompt`, which renders it
+ * as a self-closing `<error />` element.
+ */
+export interface CrawlErrorItem {
+  /** Declared here, but `crawlResultsPrompt` does not write it for error items. */
+  content?: string;
+  /**
+   * Written as the `errorMessage` attribute. The presence of this key is what
+   * `crawlResultsPrompt` uses to tell an error item apart from a page.
+   */
+  errorMessage: string;
+  /** Written as the `errorType` attribute. */
+  errorType: string;
+  /** Written as the trailing `url` attribute when non-empty. */
+  url?: string;
+}
+
+/**
+ * Render crawl results as a compact XML string for inclusion in a prompt.
+ *
+ * Page metadata is written as attributes, always in the order `url`, `title`,
+ * `contentType`, `description`, `length`, and the page text becomes the element
+ * body. Items that carry an `errorMessage` key are rendered as self-closing
+ * `<error />` elements with `errorType`, `errorMessage` and (if present) `url`.
+ * Attribute values go through `escapeXmlAttr` and body text through
+ * `escapeXmlContent`.
+ *
+ * `siteName` on pages and `content` on error items are accepted by the types
+ * but are not written to the output.
+ *
+ * @param results - Crawled pages and/or crawl failures; rendered in input order.
+ * @returns `<no_crawl_results />` for an empty array, otherwise a
+ * `<crawlResults>` element containing one two-space-indented line per item.
+ *
+ * @example
+ * ```typescript
+ * const results = [
+ *   { title: "Page Title", url: "https://example.com", content: "..." }
+ * ];
+ * const xml = crawlResultsPrompt(results);
+ * // Output:
+ * // <crawlResults>
+ * //   <page url="https://example.com" title="Page Title">...</page>
+ * // </crawlResults>
+ * ```
+ */
+export const crawlResultsPrompt = (results: Array<CrawlResultItem | CrawlErrorItem>): string => {
+  if (results.length === 0) return '<no_crawl_results />';
+
+  const items = results
+    .map((item) => {
+      // The presence of `errorMessage` is what distinguishes a failure from a page.
+      if ('errorMessage' in item) {
+        const attrs: string[] = [
+          `errorType="${escapeXmlAttr(item.errorType)}"`,
+          `errorMessage="${escapeXmlAttr(item.errorMessage)}"`,
+        ];
+
+        if (item.url) {
+          attrs.push(`url="${escapeXmlAttr(item.url)}"`);
+        }
+
+        return `  <error ${attrs.join(' ')} />`;
+      }
+
+      // Successful page: `url` is mandatory and always comes first.
+      const attrs: string[] = [`url="${escapeXmlAttr(item.url)}"`];
+
+      // Optional string metadata is skipped when missing or empty.
+      if (item.title) {
+        attrs.push(`title="${escapeXmlAttr(item.title)}"`);
+      }
+
+      if (item.contentType) {
+        attrs.push(`contentType="${escapeXmlAttr(item.contentType)}"`);
+      }
+
+      if (item.description) {
+        attrs.push(`description="${escapeXmlAttr(item.description)}"`);
+      }
+
+      // Check the runtime type rather than `!== undefined`: a `null` coming from
+      // an untyped payload would otherwise be printed as length="null".
+      // A legitimate length of 0 is still emitted.
+      if (typeof item.length === 'number') {
+        attrs.push(`length="${item.length}"`);
+      }
+
+      const attrString = attrs.join(' ');
+      const content = item.content ? escapeXmlContent(item.content) : '';
+
+      // Pages without text collapse to a self-closing element to save tokens.
+      return content ? `  <page ${attrString}>${content}</page>` : `  <page ${attrString} />`;
+    })
+    .join('\n');
+
+  return `<crawlResults>\n${items}\n</crawlResults>`;
+};
@@ -0,0 +1,2 @@
+export * from './crawlResults';
+export * from './searchResults';
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+export * from './crawlResults';`
	`2`	`+export * from './searchResults';`