feat(research): Introduce research API with provider implementations, docs and tests
This commit is contained in:
@@ -3,6 +3,6 @@
|
||||
*/
|
||||
export const commitinfo = {
|
||||
name: '@push.rocks/smartai',
|
||||
version: '0.5.11',
|
||||
version: '0.6.0',
|
||||
description: 'SmartAi is a versatile TypeScript library designed to facilitate integration and interaction with various AI models, offering functionalities for chat, audio generation, document processing, and vision tasks.'
|
||||
}
|
||||
|
@@ -25,6 +25,31 @@ export interface ChatResponse {
|
||||
message: string;
|
||||
}
|
||||
|
||||
/**
|
||||
* Options for research interactions
|
||||
*/
|
||||
export interface ResearchOptions {
|
||||
query: string;
|
||||
searchDepth?: 'basic' | 'advanced' | 'deep';
|
||||
maxSources?: number;
|
||||
includeWebSearch?: boolean;
|
||||
background?: boolean;
|
||||
}
|
||||
|
||||
/**
|
||||
* Response format for research interactions
|
||||
*/
|
||||
export interface ResearchResponse {
|
||||
answer: string;
|
||||
sources: Array<{
|
||||
url: string;
|
||||
title: string;
|
||||
snippet: string;
|
||||
}>;
|
||||
searchQueries?: string[];
|
||||
metadata?: any;
|
||||
}
|
||||
|
||||
/**
|
||||
* Abstract base class for multi-modal AI models.
|
||||
* Provides a common interface for different AI providers (OpenAI, Anthropic, Perplexity, Ollama)
|
||||
@@ -98,4 +123,12 @@ export abstract class MultiModalModel {
|
||||
pdfDocuments: Uint8Array[];
|
||||
messageHistory: ChatMessage[];
|
||||
}): Promise<{ message: any }>;
|
||||
|
||||
  /**
   * Research and web search capabilities.
   * Concrete providers either perform a grounded research request or throw
   * when they have no research support.
   * @param optionsArg Options containing the research query and configuration
   * @returns Promise resolving to the research results with sources
   * @throws Error if the provider doesn't support research capabilities
   */
  public abstract research(optionsArg: ResearchOptions): Promise<ResearchResponse>;
|
||||
}
|
||||
|
@@ -1,3 +1,9 @@
|
||||
export * from './classes.smartai.js';
|
||||
export * from './abstract.classes.multimodal.js';
|
||||
export * from './provider.openai.js';
|
||||
export * from './provider.anthropic.js';
|
||||
export * from './provider.perplexity.js';
|
||||
export * from './provider.groq.js';
|
||||
export * from './provider.ollama.js';
|
||||
export * from './provider.xai.js';
|
||||
export * from './provider.exo.js';
|
||||
|
@@ -1,13 +1,16 @@
|
||||
import * as plugins from './plugins.js';
|
||||
import * as paths from './paths.js';
|
||||
import { MultiModalModel } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage, ResearchOptions, ResearchResponse } from './abstract.classes.multimodal.js';
|
||||
import type { ImageBlockParam, TextBlockParam } from '@anthropic-ai/sdk/resources/messages';
|
||||
|
||||
type ContentBlock = ImageBlockParam | TextBlockParam;
|
||||
|
||||
export interface IAnthropicProviderOptions {
|
||||
anthropicToken: string;
|
||||
enableWebSearch?: boolean;
|
||||
searchDomainAllowList?: string[];
|
||||
searchDomainBlockList?: string[];
|
||||
}
|
||||
|
||||
export class AnthropicProvider extends MultiModalModel {
|
||||
@@ -239,4 +242,121 @@ export class AnthropicProvider extends MultiModalModel {
|
||||
}
|
||||
};
|
||||
}
|
||||
|
||||
public async research(optionsArg: ResearchOptions): Promise<ResearchResponse> {
|
||||
// Prepare the messages for the research request
|
||||
const systemMessage = `You are a research assistant with web search capabilities.
|
||||
Provide comprehensive, well-researched answers with citations and sources.
|
||||
When searching the web, be thorough and cite your sources accurately.`;
|
||||
|
||||
try {
|
||||
// Build the tool configuration for web search
|
||||
const tools = this.options.enableWebSearch ? [
|
||||
{
|
||||
type: 'computer_20241022' as const,
|
||||
name: 'web_search',
|
||||
description: 'Search the web for current information',
|
||||
input_schema: {
|
||||
type: 'object' as const,
|
||||
properties: {
|
||||
query: {
|
||||
type: 'string',
|
||||
description: 'The search query'
|
||||
}
|
||||
},
|
||||
required: ['query']
|
||||
}
|
||||
}
|
||||
] : [];
|
||||
|
||||
// Configure the request based on search depth
|
||||
const maxTokens = optionsArg.searchDepth === 'deep' ? 8192 :
|
||||
optionsArg.searchDepth === 'advanced' ? 6144 : 4096;
|
||||
|
||||
// Create the research request
|
||||
const requestParams: any = {
|
||||
model: 'claude-3-opus-20240229',
|
||||
system: systemMessage,
|
||||
messages: [
|
||||
{
|
||||
role: 'user' as const,
|
||||
content: optionsArg.query
|
||||
}
|
||||
],
|
||||
max_tokens: maxTokens,
|
||||
temperature: 0.7
|
||||
};
|
||||
|
||||
// Add tools if web search is enabled
|
||||
if (tools.length > 0) {
|
||||
requestParams.tools = tools;
|
||||
requestParams.tool_choice = { type: 'auto' };
|
||||
}
|
||||
|
||||
// Execute the research request
|
||||
const result = await this.anthropicApiClient.messages.create(requestParams);
|
||||
|
||||
// Extract the answer from content blocks
|
||||
let answer = '';
|
||||
const sources: Array<{ url: string; title: string; snippet: string }> = [];
|
||||
const searchQueries: string[] = [];
|
||||
|
||||
// Process content blocks
|
||||
for (const block of result.content) {
|
||||
if ('text' in block) {
|
||||
answer += block.text;
|
||||
}
|
||||
}
|
||||
|
||||
// Parse sources from the answer (Claude includes citations in various formats)
|
||||
const urlRegex = /\[([^\]]+)\]\(([^)]+)\)/g;
|
||||
let match: RegExpExecArray | null;
|
||||
|
||||
while ((match = urlRegex.exec(answer)) !== null) {
|
||||
sources.push({
|
||||
title: match[1],
|
||||
url: match[2],
|
||||
snippet: ''
|
||||
});
|
||||
}
|
||||
|
||||
// Also look for plain URLs
|
||||
const plainUrlRegex = /https?:\/\/[^\s\)]+/g;
|
||||
const plainUrls = answer.match(plainUrlRegex) || [];
|
||||
|
||||
for (const url of plainUrls) {
|
||||
// Check if this URL is already in sources
|
||||
if (!sources.some(s => s.url === url)) {
|
||||
sources.push({
|
||||
title: new URL(url).hostname,
|
||||
url: url,
|
||||
snippet: ''
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
// Extract tool use information if available
|
||||
if ('tool_use' in result && Array.isArray(result.tool_use)) {
|
||||
for (const toolUse of result.tool_use) {
|
||||
if (toolUse.name === 'web_search' && toolUse.input?.query) {
|
||||
searchQueries.push(toolUse.input.query);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return {
|
||||
answer,
|
||||
sources,
|
||||
searchQueries: searchQueries.length > 0 ? searchQueries : undefined,
|
||||
metadata: {
|
||||
model: 'claude-3-opus-20240229',
|
||||
searchDepth: optionsArg.searchDepth || 'basic',
|
||||
tokensUsed: result.usage?.output_tokens
|
||||
}
|
||||
};
|
||||
} catch (error) {
|
||||
console.error('Anthropic research error:', error);
|
||||
throw new Error(`Failed to perform research: ${error.message}`);
|
||||
}
|
||||
}
|
||||
}
|
@@ -1,7 +1,7 @@
|
||||
import * as plugins from './plugins.js';
|
||||
import * as paths from './paths.js';
|
||||
import { MultiModalModel } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage, ResearchOptions, ResearchResponse } from './abstract.classes.multimodal.js';
|
||||
import type { ChatCompletionMessageParam } from 'openai/resources/chat/completions';
|
||||
|
||||
export interface IExoProviderOptions {
|
||||
@@ -125,4 +125,8 @@ export class ExoProvider extends MultiModalModel {
|
||||
}): Promise<{ message: any }> {
|
||||
throw new Error('Document processing is not supported by Exo provider');
|
||||
}
|
||||
|
||||
public async research(optionsArg: ResearchOptions): Promise<ResearchResponse> {
|
||||
throw new Error('Research capabilities are not yet supported by Exo provider.');
|
||||
}
|
||||
}
|
||||
|
@@ -1,7 +1,7 @@
|
||||
import * as plugins from './plugins.js';
|
||||
import * as paths from './paths.js';
|
||||
import { MultiModalModel } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage, ResearchOptions, ResearchResponse } from './abstract.classes.multimodal.js';
|
||||
|
||||
export interface IGroqProviderOptions {
|
||||
groqToken: string;
|
||||
@@ -189,4 +189,8 @@ export class GroqProvider extends MultiModalModel {
|
||||
}): Promise<{ message: any }> {
|
||||
throw new Error('Document processing is not yet supported by Groq.');
|
||||
}
|
||||
|
||||
public async research(optionsArg: ResearchOptions): Promise<ResearchResponse> {
|
||||
throw new Error('Research capabilities are not yet supported by Groq provider.');
|
||||
}
|
||||
}
|
@@ -1,7 +1,7 @@
|
||||
import * as plugins from './plugins.js';
|
||||
import * as paths from './paths.js';
|
||||
import { MultiModalModel } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage, ResearchOptions, ResearchResponse } from './abstract.classes.multimodal.js';
|
||||
|
||||
export interface IOllamaProviderOptions {
|
||||
baseUrl?: string;
|
||||
@@ -251,4 +251,8 @@ export class OllamaProvider extends MultiModalModel {
|
||||
}
|
||||
};
|
||||
}
|
||||
|
||||
public async research(optionsArg: ResearchOptions): Promise<ResearchResponse> {
|
||||
throw new Error('Research capabilities are not yet supported by Ollama provider.');
|
||||
}
|
||||
}
|
@@ -9,13 +9,15 @@ export type TChatCompletionRequestMessage = {
|
||||
};
|
||||
|
||||
import { MultiModalModel } from './abstract.classes.multimodal.js';
|
||||
import type { ResearchOptions, ResearchResponse } from './abstract.classes.multimodal.js';
|
||||
|
||||
export interface IOpenaiProviderOptions {
|
||||
openaiToken: string;
|
||||
chatModel?: string;
|
||||
audioModel?: string;
|
||||
visionModel?: string;
|
||||
// Optionally add more model options (e.g., documentModel) if needed.
|
||||
researchModel?: string;
|
||||
enableWebSearch?: boolean;
|
||||
}
|
||||
|
||||
export class OpenAiProvider extends MultiModalModel {
|
||||
@@ -229,4 +231,111 @@ export class OpenAiProvider extends MultiModalModel {
|
||||
const result = await this.openAiApiClient.chat.completions.create(requestParams);
|
||||
return result.choices[0].message.content || '';
|
||||
}
|
||||
|
||||
public async research(optionsArg: ResearchOptions): Promise<ResearchResponse> {
|
||||
// Determine which model to use based on search depth
|
||||
let model: string;
|
||||
if (optionsArg.searchDepth === 'deep') {
|
||||
model = this.options.researchModel || 'o4-mini-deep-research-2025-06-26';
|
||||
} else {
|
||||
model = this.options.chatModel || 'gpt-5-mini';
|
||||
}
|
||||
|
||||
// Prepare the request parameters
|
||||
const requestParams: any = {
|
||||
model,
|
||||
messages: [
|
||||
{
|
||||
role: 'system',
|
||||
content: 'You are a research assistant. Provide comprehensive answers with citations and sources when available.'
|
||||
},
|
||||
{
|
||||
role: 'user',
|
||||
content: optionsArg.query
|
||||
}
|
||||
],
|
||||
temperature: 0.7
|
||||
};
|
||||
|
||||
// Add web search tools if requested
|
||||
if (optionsArg.includeWebSearch || optionsArg.searchDepth === 'deep') {
|
||||
requestParams.tools = [
|
||||
{
|
||||
type: 'function',
|
||||
function: {
|
||||
name: 'web_search',
|
||||
description: 'Search the web for information',
|
||||
parameters: {
|
||||
type: 'object',
|
||||
properties: {
|
||||
query: {
|
||||
type: 'string',
|
||||
description: 'The search query'
|
||||
}
|
||||
},
|
||||
required: ['query']
|
||||
}
|
||||
}
|
||||
}
|
||||
];
|
||||
requestParams.tool_choice = 'auto';
|
||||
}
|
||||
|
||||
// Add background flag for deep research
|
||||
if (optionsArg.background && optionsArg.searchDepth === 'deep') {
|
||||
requestParams.background = true;
|
||||
}
|
||||
|
||||
try {
|
||||
// Execute the research request
|
||||
const result = await this.openAiApiClient.chat.completions.create(requestParams);
|
||||
|
||||
// Extract the answer
|
||||
const answer = result.choices[0].message.content || '';
|
||||
|
||||
// Parse sources from the response (OpenAI often includes URLs in markdown format)
|
||||
const sources: Array<{ url: string; title: string; snippet: string }> = [];
|
||||
const urlRegex = /\[([^\]]+)\]\(([^)]+)\)/g;
|
||||
let match: RegExpExecArray | null;
|
||||
|
||||
while ((match = urlRegex.exec(answer)) !== null) {
|
||||
sources.push({
|
||||
title: match[1],
|
||||
url: match[2],
|
||||
snippet: '' // OpenAI doesn't provide snippets in standard responses
|
||||
});
|
||||
}
|
||||
|
||||
// Extract search queries if tools were used
|
||||
const searchQueries: string[] = [];
|
||||
if (result.choices[0].message.tool_calls) {
|
||||
for (const toolCall of result.choices[0].message.tool_calls) {
|
||||
if ('function' in toolCall && toolCall.function.name === 'web_search') {
|
||||
try {
|
||||
const args = JSON.parse(toolCall.function.arguments);
|
||||
if (args.query) {
|
||||
searchQueries.push(args.query);
|
||||
}
|
||||
} catch (e) {
|
||||
// Ignore parsing errors
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return {
|
||||
answer,
|
||||
sources,
|
||||
searchQueries: searchQueries.length > 0 ? searchQueries : undefined,
|
||||
metadata: {
|
||||
model,
|
||||
searchDepth: optionsArg.searchDepth || 'basic',
|
||||
tokensUsed: result.usage?.total_tokens
|
||||
}
|
||||
};
|
||||
} catch (error) {
|
||||
console.error('Research API error:', error);
|
||||
throw new Error(`Failed to perform research: ${error.message}`);
|
||||
}
|
||||
}
|
||||
}
|
@@ -1,7 +1,7 @@
|
||||
import * as plugins from './plugins.js';
|
||||
import * as paths from './paths.js';
|
||||
import { MultiModalModel } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage, ResearchOptions, ResearchResponse } from './abstract.classes.multimodal.js';
|
||||
|
||||
export interface IPerplexityProviderOptions {
|
||||
perplexityToken: string;
|
||||
@@ -168,4 +168,69 @@ export class PerplexityProvider extends MultiModalModel {
|
||||
}): Promise<{ message: any }> {
|
||||
throw new Error('Document processing is not supported by Perplexity.');
|
||||
}
|
||||
|
||||
public async research(optionsArg: ResearchOptions): Promise<ResearchResponse> {
|
||||
// Perplexity has Sonar models that are optimized for search
|
||||
// sonar models: sonar, sonar-pro
|
||||
const model = optionsArg.searchDepth === 'deep' ? 'sonar-pro' : 'sonar';
|
||||
|
||||
try {
|
||||
const response = await fetch('https://api.perplexity.ai/chat/completions', {
|
||||
method: 'POST',
|
||||
headers: {
|
||||
'Authorization': `Bearer ${this.options.perplexityToken}`,
|
||||
'Content-Type': 'application/json',
|
||||
},
|
||||
body: JSON.stringify({
|
||||
model,
|
||||
messages: [
|
||||
{
|
||||
role: 'system',
|
||||
content: 'You are a helpful research assistant. Provide accurate information with sources.'
|
||||
},
|
||||
{
|
||||
role: 'user',
|
||||
content: optionsArg.query
|
||||
}
|
||||
],
|
||||
temperature: 0.7,
|
||||
max_tokens: 4000
|
||||
}),
|
||||
});
|
||||
|
||||
if (!response.ok) {
|
||||
throw new Error(`Perplexity API error: ${response.statusText}`);
|
||||
}
|
||||
|
||||
const result = await response.json();
|
||||
const answer = result.choices[0].message.content;
|
||||
|
||||
// Parse citations from the response
|
||||
const sources: Array<{ url: string; title: string; snippet: string }> = [];
|
||||
|
||||
// Perplexity includes citations in the format [1], [2], etc. with sources listed
|
||||
// This is a simplified parser - could be enhanced based on actual Perplexity response format
|
||||
if (result.citations) {
|
||||
for (const citation of result.citations) {
|
||||
sources.push({
|
||||
url: citation.url || '',
|
||||
title: citation.title || '',
|
||||
snippet: citation.snippet || ''
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
return {
|
||||
answer,
|
||||
sources,
|
||||
metadata: {
|
||||
model,
|
||||
searchDepth: optionsArg.searchDepth || 'basic'
|
||||
}
|
||||
};
|
||||
} catch (error) {
|
||||
console.error('Perplexity research error:', error);
|
||||
throw new Error(`Failed to perform research: ${error.message}`);
|
||||
}
|
||||
}
|
||||
}
|
@@ -1,7 +1,7 @@
|
||||
import * as plugins from './plugins.js';
|
||||
import * as paths from './paths.js';
|
||||
import { MultiModalModel } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage } from './abstract.classes.multimodal.js';
|
||||
import type { ChatOptions, ChatResponse, ChatMessage, ResearchOptions, ResearchResponse } from './abstract.classes.multimodal.js';
|
||||
import type { ChatCompletionMessageParam } from 'openai/resources/chat/completions';
|
||||
|
||||
export interface IXAIProviderOptions {
|
||||
@@ -181,4 +181,8 @@ export class XAIProvider extends MultiModalModel {
|
||||
message: completion.choices[0]?.message?.content || ''
|
||||
};
|
||||
}
|
||||
|
||||
public async research(optionsArg: ResearchOptions): Promise<ResearchResponse> {
|
||||
throw new Error('Research capabilities are not yet supported by xAI provider.');
|
||||
}
|
||||
}
|
||||
|
Reference in New Issue
Block a user