v0.12.0

feat(ollama): add support for base64-encoded images in chat messages and forward them to the Ollama provider
v0.11.1
2026-01-20 01:10:27 +00:00 · 2026-01-20 01:10:27 +00:00 · 2026-01-20 00:37:59 +00:00 · 2026-01-20 00:37:49 +00:00 · 2026-01-20 00:12:21 +00:00 · 2026-01-20 00:12:21 +00:00
6 changed files with 151 additions and 10 deletions
--- a/changelog.md
+++ b/changelog.md
@@ -1,5 +1,20 @@
 # Changelog

+## 2026-01-20 - 0.12.0 - feat(ollama)
+add support for base64-encoded images in chat messages and forward them to the Ollama provider
+
+- Add optional images?: string[] to ChatMessage and ChatOptions interfaces (multimodal/vision support)
+- Propagate images from messageHistory and ChatOptions to the Ollama API payload in chat, chatStreaming, and streaming handlers
+- Changes are non-breaking: images are optional and existing behavior is preserved when absent
+
+## 2026-01-20 - 0.11.0 - feat(ollama)
+support defaultOptions and defaultTimeout for ollama provider
+
+- Added ollama.defaultOptions object with fields: num_ctx, temperature, top_k, top_p, repeat_penalty, num_predict, stop, seed
+- Added ollama.defaultTimeout option
+- Pass defaultOptions and defaultTimeout into OllamaProvider constructor when initializing the provider
+- Non-breaking change: existing behavior preserved if new fields are undefined
+
 ## 2026-01-20 - 0.10.1 - fix()
 no changes detected — no release necessary

--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
  "name": "@push.rocks/smartai",
-  "version": "0.10.1",
+  "version": "0.12.0",
  "private": false,
  "description": "SmartAi is a versatile TypeScript library designed to facilitate integration and interaction with various AI models, offering functionalities for chat, audio generation, document processing, and vision tasks.",
  "main": "dist_ts/index.js",
--- a/ts/00_commitinfo_data.ts
+++ b/ts/00_commitinfo_data.ts
@@ -3,6 +3,6 @@
 */
 export const commitinfo = {
  name: '@push.rocks/smartai',
-  version: '0.10.1',
+  version: '0.12.0',
  description: 'SmartAi is a versatile TypeScript library designed to facilitate integration and interaction with various AI models, offering functionalities for chat, audio generation, document processing, and vision tasks.'
 }
--- a/ts/abstract.classes.multimodal.ts
+++ b/ts/abstract.classes.multimodal.ts
@@ -6,6 +6,8 @@ import * as plugins from './plugins.js';
 export interface ChatMessage {
  role: 'assistant' | 'user' | 'system';
  content: string;
+  /** Base64-encoded images for vision-capable models */
+  images?: string[];
 }

 /**
@@ -15,6 +17,16 @@ export interface ChatOptions {
  systemMessage: string;
  userMessage: string;
  messageHistory: ChatMessage[];
+  /** Base64-encoded images for the current message (vision-capable models) */
+  images?: string[];
+}
+
+/**
+ * Options for streaming chat interactions
+ */
+export interface StreamingChatOptions extends ChatOptions {
+  /** Callback fired for each token during generation */
+  onToken?: (token: string) => void;
 }

 /**
@@ -161,6 +173,14 @@ export abstract class MultiModalModel {
   */
  public abstract chatStream(input: ReadableStream<Uint8Array>): Promise<ReadableStream<string>>;

+  /**
+   * Streaming chat with token callback
+   * Calls onToken for each token generated, returns final response
+   * @param optionsArg Options containing system message, user message, message history, and onToken callback
+   * @returns Promise resolving to the assistant's response
+   */
+  public chatStreaming?(optionsArg: StreamingChatOptions): Promise<ChatResponse>;
+
  /**
   * Text-to-speech conversion
   * @param optionsArg Options containing the message to convert to speech
--- a/ts/classes.smartai.ts
+++ b/ts/classes.smartai.ts
@@ -32,6 +32,17 @@ export interface ISmartAiOptions {
    baseUrl?: string;
    model?: string;
    visionModel?: string;
+    defaultOptions?: {
+      num_ctx?: number;
+      temperature?: number;
+      top_k?: number;
+      top_p?: number;
+      repeat_penalty?: number;
+      num_predict?: number;
+      stop?: string[];
+      seed?: number;
+    };
+    defaultTimeout?: number;
  };
  elevenlabs?: {
    defaultVoiceId?: string;
@@ -111,6 +122,8 @@ export class SmartAi {
        baseUrl: this.options.ollama.baseUrl,
        model: this.options.ollama.model,
        visionModel: this.options.ollama.visionModel,
+        defaultOptions: this.options.ollama.defaultOptions,
+        defaultTimeout: this.options.ollama.defaultTimeout,
      });
      await this.ollamaProvider.start();
    }
--- a/ts/provider.ollama.ts
+++ b/ts/provider.ollama.ts
@@ -9,7 +9,8 @@ import type {
  ResearchResponse,
  ImageGenerateOptions,
  ImageEditOptions,
-  ImageResponse
+  ImageResponse,
+  StreamingChatOptions
 } from './abstract.classes.multimodal.js';

 /**
@@ -42,6 +43,7 @@ export interface IOllamaChatOptions extends ChatOptions {
  options?: IOllamaModelOptions;  // Per-request model options
  timeout?: number;               // Per-request timeout in ms
  model?: string;                 // Per-request model override
+  // images is inherited from ChatOptions
 }

 /**
@@ -202,10 +204,30 @@ export class OllamaProvider extends MultiModalModel {
  // Implementing the synchronous chat interaction
  public async chat(optionsArg: ChatOptions): Promise<ChatResponse> {
    // Format messages for Ollama
+    const historyMessages = optionsArg.messageHistory.map((msg) => {
+      const formatted: { role: string; content: string; images?: string[] } = {
+        role: msg.role,
+        content: msg.content,
+      };
+      if (msg.images && msg.images.length > 0) {
+        formatted.images = msg.images;
+      }
+      return formatted;
+    });
+
+    // Build user message with optional images
+    const userMessage: { role: string; content: string; images?: string[] } = {
+      role: 'user',
+      content: optionsArg.userMessage,
+    };
+    if (optionsArg.images && optionsArg.images.length > 0) {
+      userMessage.images = optionsArg.images;
+    }
+
    const messages = [
      { role: 'system', content: optionsArg.systemMessage },
-      ...optionsArg.messageHistory,
-      { role: 'user', content: optionsArg.userMessage }
+      ...historyMessages,
+      userMessage,
    ];

    // Make API call to Ollama with defaultOptions and timeout
@@ -235,6 +257,35 @@ export class OllamaProvider extends MultiModalModel {
    };
  }

+  /**
+   * Streaming chat with token callback (implements MultiModalModel interface)
+   * Calls onToken for each token generated during the response
+   */
+  public async chatStreaming(optionsArg: StreamingChatOptions): Promise<ChatResponse> {
+    const onToken = optionsArg.onToken;
+
+    // Use existing collectStreamResponse with callback, including images
+    const response = await this.collectStreamResponse(
+      {
+        systemMessage: optionsArg.systemMessage,
+        userMessage: optionsArg.userMessage,
+        messageHistory: optionsArg.messageHistory,
+        images: optionsArg.images,
+      },
+      (chunk) => {
+        if (onToken) {
+          if (chunk.thinking) onToken(chunk.thinking);
+          if (chunk.content) onToken(chunk.content);
+        }
+      }
+    );
+
+    return {
+      role: 'assistant' as const,
+      message: response.message,
+    };
+  }
+
  /**
   * Streaming chat with async iteration and options support
   */
@@ -245,10 +296,31 @@ export class OllamaProvider extends MultiModalModel {
    const timeout = optionsArg.timeout || this.defaultTimeout;
    const modelOptions = { ...this.defaultOptions, ...optionsArg.options };

+    // Format history messages with optional images
+    const historyMessages = optionsArg.messageHistory.map((msg) => {
+      const formatted: { role: string; content: string; images?: string[] } = {
+        role: msg.role,
+        content: msg.content,
+      };
+      if (msg.images && msg.images.length > 0) {
+        formatted.images = msg.images;
+      }
+      return formatted;
+    });
+
+    // Build user message with optional images
+    const userMessage: { role: string; content: string; images?: string[] } = {
+      role: 'user',
+      content: optionsArg.userMessage,
+    };
+    if (optionsArg.images && optionsArg.images.length > 0) {
+      userMessage.images = optionsArg.images;
+    }
+
    const messages = [
      { role: 'system', content: optionsArg.systemMessage },
-      ...optionsArg.messageHistory,
-      { role: 'user', content: optionsArg.userMessage }
+      ...historyMessages,
+      userMessage,
    ];

    const response = await fetch(`${this.baseUrl}/api/chat`, {
@@ -338,10 +410,31 @@ export class OllamaProvider extends MultiModalModel {
    const timeout = optionsArg.timeout || this.defaultTimeout;
    const modelOptions = { ...this.defaultOptions, ...optionsArg.options };

+    // Format history messages with optional images
+    const historyMessages = optionsArg.messageHistory.map((msg) => {
+      const formatted: { role: string; content: string; images?: string[] } = {
+        role: msg.role,
+        content: msg.content,
+      };
+      if (msg.images && msg.images.length > 0) {
+        formatted.images = msg.images;
+      }
+      return formatted;
+    });
+
+    // Build user message with optional images
+    const userMessage: { role: string; content: string; images?: string[] } = {
+      role: 'user',
+      content: optionsArg.userMessage,
+    };
+    if (optionsArg.images && optionsArg.images.length > 0) {
+      userMessage.images = optionsArg.images;
+    }
+
    const messages = [
      { role: 'system', content: optionsArg.systemMessage },
-      ...optionsArg.messageHistory,
-      { role: 'user', content: optionsArg.userMessage }
+      ...historyMessages,
+      userMessage,
    ];

    const response = await fetch(`${this.baseUrl}/api/chat`, {
Author	SHA1	Message	Date
Juergen Kunz	ae8d3ccf33	v0.12.0 (some checks failed — Default (tags) / security (push): failing after 1s; Default (tags) / test (push): failing after 1s; Default (tags) / release (push): skipped; Default (tags) / metadata (push): skipped)	2026-01-20 01:10:27 +00:00
Juergen Kunz	3b900d0ba9	feat(ollama): add support for base64-encoded images in chat messages and forward them to the Ollama provider	2026-01-20 01:10:27 +00:00
Juergen Kunz	d49152390f	v0.11.1	2026-01-20 00:37:59 +00:00
Juergen Kunz	d615ec9227	feat(streaming): add chatStreaming method with token callback for real-time generation progress. Changes: add StreamingChatOptions interface with onToken callback; add optional chatStreaming method to MultiModalModel abstract class; implement chatStreaming in OllamaProvider using collectStreamResponse.	2026-01-20 00:37:49 +00:00
Juergen Kunz	dfa863ee7d	v0.11.0 (some checks failed — Default (tags) / security (push): failing after 1s; Default (tags) / test (push): failing after 1s; Default (tags) / release (push): skipped; Default (tags) / metadata (push): skipped)	2026-01-20 00:12:21 +00:00
Juergen Kunz	c84ede1f1d	feat(ollama): support defaultOptions and defaultTimeout for ollama provider	2026-01-20 00:12:21 +00:00