drivecore
diff --git a/‎packages/agent/src/core/types.ts
Lines changed: 1 addition & 1 deletion b/‎packages/agent/src/core/types.ts
Lines changed: 1 addition & 1 deletion
diff --git a/‎packages/agent/src/tools/session/lib/filterPageContent.test.ts
Lines changed: 123 additions & 0 deletions b/‎packages/agent/src/tools/session/lib/filterPageContent.test.ts
Lines changed: 123 additions & 0 deletions
diff --git a/‎packages/agent/src/tools/session/lib/filterPageContent.ts
Lines changed: 83 additions & 78 deletions b/‎packages/agent/src/tools/session/lib/filterPageContent.ts
Lines changed: 83 additions & 78 deletions
@@ -11,7 +11,7 @@ import { ModelProvider } from './toolAgent/config.js';
 
 export type TokenLevel = 'debug' | 'info' | 'log' | 'warn' | 'error';
 
-export type pageFilter = 'simple' | 'none' | 'readability';
+export type pageFilter = 'raw' | 'smartMarkdown';
 
 export type ToolContext = {
   logger: Logger;
 
@@ -0,0 +1,123 @@
+import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
+import { Page } from 'playwright';
+import { filterPageContent } from './filterPageContent';
+import { ToolContext } from '../../../core/types';
+
+// HTML content to use in tests
+const HTML_CONTENT = '<html><body><h1>Test Content</h1></body></html>';
+const MARKDOWN_CONTENT = '# Test Content\n\nThis is the extracted content from the page.';
+
+// Mock the Page object
+const mockPage = {
+  content: vi.fn().mockResolvedValue(HTML_CONTENT),
+  url: vi.fn().mockReturnValue('https://example.com'),
+  evaluate: vi.fn(),
+} as unknown as Page;
+
+// Mock fetch for LLM calls
+global.fetch = vi.fn();
+
+describe('filterPageContent', () => {
+  let mockContext: ToolContext;
+
+  beforeEach(() => {
+    mockContext = {
+      logger: {
+        debug: vi.fn(),
+        log: vi.fn(),
+        warn: vi.fn(),
+        error: vi.fn(),
+        info: vi.fn(),
+      },
+      provider: 'openai',
+      model: 'gpt-4',
+      apiKey: 'test-api-key',
+      baseUrl: 'https://api.openai.com/v1/chat/completions',
+      maxTokens: 4000,
+      temperature: 0.3,
+    } as unknown as ToolContext;
+
+    // Reset mocks
+    vi.resetAllMocks();
+    
+    // Mock the content method to return the HTML_CONTENT
+    mockPage.content.mockResolvedValue(HTML_CONTENT);
+    
+    // Mock fetch to return a successful response
+    (global.fetch as any).mockResolvedValue({
+      ok: true,
+      json: async () => ({
+        choices: [
+          {
+            message: {
+              content: MARKDOWN_CONTENT,
+            },
+          },
+        ],
+      }),
+    });
+  });
+
+  afterEach(() => {
+    vi.clearAllMocks();
+  });
+
+  it('should return raw DOM content with raw filter', async () => {
+    const result = await filterPageContent(mockPage, 'raw', mockContext);
+    
+    expect(mockPage.content).toHaveBeenCalled();
+    expect(result).toEqual(HTML_CONTENT);
+  });
+
+  it('should use LLM to extract content with smartMarkdown filter', async () => {
+    const result = await filterPageContent(mockPage, 'smartMarkdown', mockContext);
+    
+    expect(mockPage.content).toHaveBeenCalled();
+    expect(global.fetch).toHaveBeenCalledWith(
+      'https://api.openai.com/v1/chat/completions',
+      expect.objectContaining({
+        method: 'POST',
+        headers: expect.objectContaining({
+          'Authorization': 'Bearer test-api-key',
+        }),
+        body: expect.any(String),
+      })
+    );
+    
+    // Verify the result is the markdown content from the LLM
+    expect(result).toEqual(MARKDOWN_CONTENT);
+  });
+
+  it('should fall back to raw DOM if LLM call fails', async () => {
+    // Mock fetch to return an error
+    (global.fetch as any).mockResolvedValue({
+      ok: false,
+      text: async () => 'API Error',
+    });
+
+    const result = await filterPageContent(mockPage, 'smartMarkdown', mockContext);
+    
+    expect(mockPage.content).toHaveBeenCalled();
+    expect(mockContext.logger.error).toHaveBeenCalled();
+    expect(result).toEqual(HTML_CONTENT);
+  });
+
+  it('should fall back to raw DOM if context is not provided for smartMarkdown', async () => {
+    // Create a minimal mock context with just a logger to prevent errors
+    const minimalContext = {
+      logger: {
+        debug: vi.fn(),
+        log: vi.fn(),
+        warn: vi.fn(),
+        error: vi.fn(),
+        info: vi.fn(),
+      }
+    } as unknown as ToolContext;
+    
+    const result = await filterPageContent(mockPage, 'smartMarkdown', minimalContext);
+    
+    expect(mockPage.content).toHaveBeenCalled();
+    expect(minimalContext.logger.warn).toHaveBeenCalled();
+    expect(result).toEqual(HTML_CONTENT);
+  });
+});
@@ -1,116 +1,121 @@
 import { Readability } from '@mozilla/readability';
 import { JSDOM } from 'jsdom';
 import { Page } from 'playwright';
+import { ToolContext } from '../../../core/types.js';
 
 const OUTPUT_LIMIT = 11 * 1024; // 10KB limit
 
 /**
  * Returns the raw HTML content of the page without any processing
  */
-async function getNoneProcessedDOM(page: Page): Promise<string> {
-  return await page.content();
+async function getRawDOM(page: Page): Promise<string> {
+  const content = await page.content();
+  return content;
 }
 
 /**
- * Processes the page using Mozilla's Readability to extract the main content
- * Falls back to simple processing if Readability fails
+ * Uses an LLM to extract the main content from a page and format it as markdown
  */
-async function getReadabilityProcessedDOM(page: Page): Promise<string> {
+async function getSmartMarkdownContent(page: Page, context: ToolContext): Promise<string> {
   try {
     const html = await page.content();
     const url = page.url();
-    const dom = new JSDOM(html, { url });
-    const reader = new Readability(dom.window.document);
-    const article = reader.parse();
+    
+    // Create a system prompt for the LLM
+    const systemPrompt = `You are an expert at extracting the main content from web pages.
+Given the HTML content of a webpage, extract only the main informative content.
+Format the extracted content as clean, well-structured markdown.
+Ignore headers, footers, navigation, sidebars, ads, and other non-content elements.
+Preserve the important headings, paragraphs, lists, and other content structures.
+Do not include any explanations or descriptions about what you're doing.
+Just return the extracted content as markdown.`;
 
-    if (!article) {
-      console.warn(
-        'Readability could not parse the page, falling back to simple mode',
-      );
-      return getSimpleProcessedDOM(page);
+    // Use the configured LLM to extract the content
+    const { provider, model, apiKey, baseUrl } = context;
+    
+    if (!provider || !model) {
+      context.logger.warn('LLM provider or model not available, falling back to raw DOM');
+      return getRawDOM(page);
     }
 
-    // Return a formatted version of the article
-    return JSON.stringify(
-      {
-        url: url,
-        title: article.title || '',
-        content: article.content || '',
-        textContent: article.textContent || '',
-        excerpt: article.excerpt || '',
-        byline: article.byline || '',
-        dir: article.dir || '',
-        siteName: article.siteName || '',
-        length: article.length || 0,
-      },
-      null,
-      2,
-    );
+    try {
+      // Import the createProvider function from the provider module
+      const { createProvider } = await import('../../../core/llm/provider.js');
+      
+      // Create a provider instance using the provider abstraction
+      const llmProvider = createProvider(provider, model, {
+        apiKey,
+        baseUrl
+      });
+      
+      // Generate text using the provider
+      const response = await llmProvider.generateText({
+        messages: [
+          {
+            role: 'system',
+            content: systemPrompt
+          },
+          {
+            role: 'user',
+            content: `URL: ${url}\n\nHTML content:\n${html}`
+          }
+        ],
+        temperature: 0.3,
+        maxTokens: 4000
+      });
+      
+      // Extract the markdown content from the response
+      const markdown = response.text;
+      
+      if (!markdown) {
+        context.logger.warn('LLM returned empty content, falling back to raw DOM');
+        return getRawDOM(page);
+      }
+      
+      // Log token usage for monitoring
+      context.logger.debug(`Token usage for content extraction: ${JSON.stringify(response.tokenUsage)}`);
+      
+      return markdown;
+    } catch (llmError) {
+      context.logger.error('Error using LLM provider for content extraction:', llmError);
+      return getRawDOM(page);
+    }
   } catch (error) {
-    console.error('Error using Readability:', error);
-    // Fallback to simple mode if Readability fails
-    return getSimpleProcessedDOM(page);
+    context.logger.error('Error using LLM for content extraction:', error);
+    // Fallback to raw mode if LLM processing fails
+    return getRawDOM(page);
   }
 }
 
-/**
- * Processes the page by removing invisible elements and non-visual tags
- */
-async function getSimpleProcessedDOM(page: Page): Promise<string> {
-  const domContent = await page.evaluate(() => {
-    const clone = document.documentElement;
-
-    const elements = clone.querySelectorAll('*');
-
-    const elementsToRemove: Element[] = [];
-    elements.forEach((element) => {
-      const computedStyle = window.getComputedStyle(element);
-      const isVisible =
-        computedStyle.display !== 'none' &&
-        computedStyle.visibility !== 'hidden' &&
-        computedStyle.opacity !== '0';
-
-      if (!isVisible) {
-        elementsToRemove.push(element);
-      }
-    });
-
-    const nonVisualTags = clone.querySelectorAll(
-      'noscript, iframe, link[rel="stylesheet"], meta, svg, img, symbol, path, style, script',
-    );
-    nonVisualTags.forEach((element) => elementsToRemove.push(element));
-
-    elementsToRemove.forEach((element) => element.remove());
-
-    return clone.outerHTML;
-  });
-
-  return domContent.replace(/\n/g, '').replace(/\s+/g, ' ');
-}
-
 /**
  * Gets the rendered DOM of a page with specified processing method
  */
 export async function filterPageContent(
   page: Page,
-  pageFilter: 'simple' | 'none' | 'readability',
+  pageFilter: 'raw' | 'smartMarkdown',
+  context?: ToolContext
 ): Promise<string> {
   let result: string = '';
+  
   switch (pageFilter) {
-    case 'none':
-      result = await getNoneProcessedDOM(page);
-      break;
-    case 'readability':
-      result = await getReadabilityProcessedDOM(page);
+    case 'smartMarkdown':
+      if (!context) {
+        console.warn('ToolContext required for smartMarkdown filter but not provided, falling back to raw mode');
+        result = await getRawDOM(page);
+      } else {
+        result = await getSmartMarkdownContent(page, context);
+      }
       break;
-    case 'simple':
+    case 'raw':
     default:
-      result = await getSimpleProcessedDOM(page);
+      result = await getRawDOM(page);
       break;
   }
 
-  if (result.length > OUTPUT_LIMIT) {
-    return result.slice(0, OUTPUT_LIMIT) + '...(truncated)';
+  // Ensure result is a string before checking length
+  const resultString = result || '';
+  if (resultString.length > OUTPUT_LIMIT) {
+    return resultString.slice(0, OUTPUT_LIMIT) + '...(truncated)';
   }
-  return result;
+  return resultString;
 }