5 Commits

Author SHA1 Message Date
9e19d320e1 0.0.11 2024-04-27 12:47:50 +02:00
158d49fa95 fix(core): update 2024-04-27 12:47:49 +02:00
1ce412fd00 0.0.10 2024-04-25 10:49:08 +02:00
92c382c16e fix(core): update 2024-04-25 10:49:07 +02:00
63d3b7c9bb update tsconfig 2024-04-14 17:19:32 +02:00
15 changed files with 887 additions and 553 deletions

View File

@ -16,7 +16,10 @@
"text-to-speech",
"conversation stream",
"TypeScript",
"ESM"
"ESM",
"streaming API",
"modular design",
"development tool"
]
}
},

View File

@ -1,6 +1,6 @@
{
"name": "@push.rocks/smartai",
"version": "0.0.9",
"version": "0.0.11",
"private": false,
"description": "Provides a standardized interface for integrating and conversing with multiple AI models, supporting operations like chat and potentially audio responses.",
"main": "dist_ts/index.js",
@ -17,17 +17,21 @@
"@git.zone/tsbuild": "^2.1.25",
"@git.zone/tsbundle": "^2.0.5",
"@git.zone/tsrun": "^1.2.46",
"@git.zone/tstest": "^1.0.44",
"@push.rocks/tapbundle": "^5.0.15",
"@types/node": "^20.8.7"
"@git.zone/tstest": "^1.0.90",
"@push.rocks/qenv": "^6.0.5",
"@push.rocks/tapbundle": "^5.0.23",
"@types/node": "^20.12.7"
},
"dependencies": {
"@anthropic-ai/sdk": "^0.19.1",
"@push.rocks/qenv": "^6.0.5",
"@push.rocks/smartfile": "^11.0.4",
"@push.rocks/smartpath": "^5.0.11",
"@anthropic-ai/sdk": "^0.20.7",
"@push.rocks/smartarray": "^1.0.8",
"@push.rocks/smartfile": "^11.0.14",
"@push.rocks/smartpath": "^5.0.18",
"@push.rocks/smartpdf": "^3.1.5",
"@push.rocks/smartpromise": "^4.0.3",
"openai": "^4.31.0"
"@push.rocks/smartrequest": "^2.0.22",
"@push.rocks/webstream": "^1.0.8",
"openai": "^4.38.5"
},
"repository": {
"type": "git",
@ -59,6 +63,9 @@
"text-to-speech",
"conversation stream",
"TypeScript",
"ESM"
"ESM",
"streaming API",
"modular design",
"development tool"
]
}

1016
pnpm-lock.yaml generated

File diff suppressed because it is too large Load Diff

View File

@ -1,2 +1,4 @@
required:
- OPENAI_TOKEN
- OPENAI_TOKEN
- ANTHROPIC_TOKEN
- PERPLEXITY_TOKEN

1
readme.hints.md Normal file
View File

@ -0,0 +1 @@

View File

@ -1,108 +1,112 @@
# @push.rocks/smartai
a standardized interface to talk to AI models
Provides a standardized interface for integrating and conversing with multiple AI models, supporting operations like chat and potentially audio responses.
## Install
To install `@push.rocks/smartai`, run the following command in your terminal:
To add @push.rocks/smartai to your project, run the following command in your terminal:
```bash
npm install @push.rocks/smartai
```
This will add the package to your project's dependencies.
This command installs the package and adds it to your project's dependencies.
## Usage
In the following guide, you'll learn how to leverage `@push.rocks/smartai` for integrating AI models into your applications using TypeScript with ESM syntax.
The usage section delves into how to leverage the `@push.rocks/smartai` package to interact with AI models in an application. This package simplifies the integration and conversation with AI models by providing a standardized interface. The examples below demonstrate the package's capabilities in engaging with AI models for chat operations and potentially handling audio responses using TypeScript and ESM syntax.
### Getting Started
### Integrating AI Models
First, you'll need to import the necessary modules from `@push.rocks/smartai`. This typically includes the main `SmartAi` class along with any specific provider classes you intend to use, such as `OpenAiProvider` or `AnthropicProvider`.
#### Importing the Module
Start by importing `SmartAi` and the AI providers you wish to use from `@push.rocks/smartai`.
```typescript
import { SmartAi, OpenAiProvider, AnthropicProvider } from '@push.rocks/smartai';
```
### Initialization
#### Initializing `SmartAi`
Create an instance of `SmartAi` by providing the required options, which include authentication tokens for the AI providers you plan to use.
Create an instance of `SmartAi` with the necessary credentials for accessing the AI services.
```typescript
const smartAi = new SmartAi({
openaiToken: 'your-openai-token-here',
anthropicToken: 'your-anthropic-token-here'
openaiToken: 'your-openai-access-token',
anthropicToken: 'your-anthropic-access-token'
});
```
### Creating a Conversation
### Chatting with the AI
`@push.rocks/smartai` offers a versatile way to handle conversations with AI. To create a conversation using OpenAI, for instance:
#### Creating a Conversation
To begin a conversation, choose the AI provider you'd like to use. For instance, to use OpenAI:
```typescript
async function createOpenAiConversation() {
const conversation = await smartAi.createOpenApiConversation();
// Use the conversation for chatting
}
```
For Anthropic-based conversations:
Similarly, for an Anthropic AI conversation:
```typescript
async function createAnthropicConversation() {
const conversation = await smartAi.createAnthropicConversation();
// Use the conversation for chatting
}
```
### Advanced Usage: Streaming and Chat
### Streaming Chat with OpenAI
Advanced use cases might require direct access to the streaming APIs provided by the AI models. For instance, handling a chat stream with OpenAI can be achieved as follows:
#### Set Up the Conversation Stream
First, create a conversation and obtain the input and output streams.
For more advanced scenarios, like a streaming chat with OpenAI, you would interact with the chat stream directly:
```typescript
const conversation = await smartAi.createOpenApiConversation();
// Assuming a conversation has been created and initialized...
const inputStreamWriter = conversation.getInputStreamWriter();
const outputStream = conversation.getOutputStream();
```
#### Write to Input Stream
// Write a message to the input stream for the AI to process
await inputStreamWriter.write('Hello, how can I help you today?');
To send messages to the AI model, use the input stream writer.
```typescript
await inputStreamWriter.write('Hello, SmartAI!');
```
#### Processing Output Stream
Output from the AI model can be processed by reading from the output stream.
```typescript
// Listen to the output stream for responses from AI
const reader = outputStream.getReader();
reader.read().then(function processText({ done, value }) {
if (done) {
console.log("Stream complete");
console.log("No more messages from AI");
return;
}
console.log("Received from AI:", value);
console.log("AI says:", value);
// Continue reading messages
reader.read().then(processText);
});
```
### Handling Audio
### Handling Audio Responses
`@push.rocks/smartai` also supports handling audio responses from AI models. To generate and retrieve audio output:
The package may also support converting text responses from the AI into audio. While specific implementation details depend on the AI provider's capabilities, a generic approach would involve creating a text-to-speech instance and utilizing it:
```typescript
// This is a hypothetical function call as the implementation might vary
const tts = await TTS.createWithOpenAi(smartAi);
// The TTS instance would then be used to convert text to speech
```
This code snippet initializes text-to-speech (TTS) capabilities using the OpenAI model. Further customization and usage of audio APIs will depend on the capabilities offered by the specific AI model and provider you are working with.
### Extensive Feature Set
`@push.rocks/smartai` provides comprehensive support for interacting with various AI models, not limited to text chat. It encompasses audio responses, potentially incorporating AI-powered analyses, and other multi-modal interactions.
Refer to the specific AI providers documentation through `@push.rocks/smartai`, such as OpenAI and Anthropic, for detailed guidance on utilizing the full spectrum of capabilities, including the implementation of custom conversation flows, handling streaming data efficiently, and generating audio responses from AI conversations.
### Conclusion
`@push.rocks/smartai` offers a flexible and standardized interface for interacting with AI models, streamlining the development of applications that leverage AI capabilities. Through the outlined examples, you've seen how to initialize the library, create conversations, and handle both text and audio interactions with AI models in a TypeScript environment following ESM syntax.
Equipped with `@push.rocks/smartai`, developers can streamline the integration of sophisticated AI interactions into their applications. The package facilitates robust communication with AI models, supporting diverse operations from simple chats to complex audio feedback mechanisms, all within a unified, easy-to-use interface.
Explore the package more to uncover its full potential in creating engaging, AI-enhanced interactions in your applications.
For a comprehensive understanding of all features and to explore more advanced use cases, refer to the official [documentation](https://code.foss.global/push.rocks/smartai#readme) and check the `npmextra.json` file's `tsdocs` section for additional insights on module usage.
## License and Legal Information

View File

@ -1,8 +1,94 @@
import { expect, expectAsync, tap } from '@push.rocks/tapbundle';
import * as smartai from '../ts/index.js'
import * as qenv from '@push.rocks/qenv';
import * as smartrequest from '@push.rocks/smartrequest';
import * as smartfile from '@push.rocks/smartfile';
tap.test('first test', async () => {
console.log(smartai)
const testQenv = new qenv.Qenv('./', './.nogit/');
import * as smartai from '../ts/index.js';
let testSmartai: smartai.SmartAi;
tap.test('should create a smartai instance', async () => {
testSmartai = new smartai.SmartAi({
openaiToken: await testQenv.getEnvVarOnDemand('OPENAI_TOKEN'),
exposeCredentials: {
exposedBaseUrl: await testQenv.getEnvVarOnDemand('EXPOSED_BASE_URL'),
webdav: {
webdavCredentials: {
password: await testQenv.getEnvVarOnDemand('WEBDAV_SERVER_TOKEN'),
serverUrl: await testQenv.getEnvVarOnDemand('WEBDAV_SERVER_URL'),
},
webdavSubPath: 'smartai'
}
}
});
await testSmartai.start();
});
tap.test('should create chat response with openai', async () => {
const userMessage = 'How are you?';
const response = await testSmartai.openaiProvider.chat({
systemMessage: 'Hello',
userMessage: userMessage,
messageHistory: [
],
});
console.log(`userMessage: ${userMessage}`);
console.log(response.message.content);
});
tap.test('should document a pdf', async () => {
const pdfUrl = 'https://www.w3.org/WAI/ER/tests/xhtml/testfiles/resources/pdf/dummy.pdf';
const pdfResponse = await smartrequest.getBinary(pdfUrl);
const result = await testSmartai.openaiProvider.document({
systemMessage: 'Classify the document. Only the following answers are allowed: "invoice", "bank account statement", "contract", "other"',
userMessage: "Classify the document.",
messageHistory: [],
pdfDocuments: [pdfResponse.body],
});
console.log(result);
});
tap.test('should recognize companies in a pdf', async () => {
const pdfBuffer = await smartfile.fs.toBuffer('./.nogit/demo_without_textlayer.pdf');
const result = await testSmartai.openaiProvider.document({
systemMessage: `
summarize the document.
answer in JSON format, adhering to the following schema:
\`\`\`typescript
type TAnswer = {
entitySender: {
type: 'official state entity' | 'company' | 'person';
name: string;
address: string;
city: string;
country: string;
EU: boolean; // wether the entity is within EU
};
entityReceiver: {
type: 'official state entity' | 'company' | 'person';
name: string;
address: string;
city: string;
country: string;
EU: boolean; // wether the entity is within EU
};
date: string; // the date of the document as YYYY-MM-DD
title: string; // a short title, suitable for a filename
}
\`\`\`
`,
userMessage: "Classify the document.",
messageHistory: [],
pdfDocuments: [pdfBuffer],
});
console.log(result);
})
tap.start()
tap.test('should stop the smartai instance', async () => {
await testSmartai.stop();
});
export default tap.start();

View File

@ -3,6 +3,6 @@
*/
export const commitinfo = {
name: '@push.rocks/smartai',
version: '0.0.9',
version: '0.0.11',
description: 'Provides a standardized interface for integrating and conversing with multiple AI models, supporting operations like chat and potentially audio responses.'
}

View File

@ -8,8 +8,22 @@ export abstract class MultiModalModel {
* stops the model
*/
abstract stop(): Promise<void>;
public abstract chat(optionsArg: {
systemMessage: string,
userMessage: string,
messageHistory: {
role: 'assistant' | 'user';
content: string;
}[]
}): Promise<{}>
// Defines a streaming interface for chat interactions.
// The implementation will vary based on the specific AI model.
abstract chatStream(input: ReadableStream<string>): ReadableStream<string>;
/**
* Defines a streaming interface for chat interactions.
* The implementation will vary based on the specific AI model.
* @param input
*/
public abstract chatStream(input: ReadableStream<string>): Promise<ReadableStream<string>>;
}

View File

@ -1,18 +1,39 @@
import { Conversation } from './classes.conversation.js';
import * as plugins from './plugins.js';
import type { AnthropicProvider } from './provider.anthropic.js';
import type { OllamaProvider } from './provider.ollama.js';
import { OpenAiProvider } from './provider.openai.js';
import type { PerplexityProvider } from './provider.perplexity.js';
export interface ISmartAiOptions {
openaiToken: string;
anthropicToken: string;
openaiToken?: string;
anthropicToken?: string;
perplexityToken?: string;
}
export class SmartAi {
public options: ISmartAiOptions;
public openaiProvider: OpenAiProvider;
public anthropicProvider: AnthropicProvider;
public perplexityProvider: PerplexityProvider;
public ollamaProvider: OllamaProvider;
constructor(optionsArg: ISmartAiOptions) {
this.options = optionsArg;
}
public async start() {
if (this.options.openaiToken) {
this.openaiProvider = new OpenAiProvider({
openaiToken: this.options.openaiToken,
});
await this.openaiProvider.start();
}
}
public async stop() {}
/**
* creates an OpenAI conversation

0
ts/interfaces.ts Normal file
View File

View File

@ -7,15 +7,23 @@ export {
// @push.rocks scope
import * as qenv from '@push.rocks/qenv';
import * as smartpath from '@push.rocks/smartpath';
import * as smartpromise from '@push.rocks/smartpromise';
import * as smartarray from '@push.rocks/smartarray';
import * as smartfile from '@push.rocks/smartfile';
import * as smartpath from '@push.rocks/smartpath';
import * as smartpdf from '@push.rocks/smartpdf';
import * as smartpromise from '@push.rocks/smartpromise';
import * as smartrequest from '@push.rocks/smartrequest';
import * as webstream from '@push.rocks/webstream';
export {
smartarray,
qenv,
smartpath,
smartpromise,
smartfile,
smartpath,
smartpdf,
smartpromise,
smartrequest,
webstream,
}
// third party

3
ts/provider.ollama.ts Normal file
View File

@ -0,0 +1,3 @@
import * as plugins from './plugins.js';
export class OllamaProvider {}

View File

@ -3,67 +3,53 @@ import * as paths from './paths.js';
import { MultiModalModel } from './abstract.classes.multimodal.js';
export class OpenAiProvider extends MultiModalModel {
private openAiToken: string;
public openAiApiClient: plugins.openai.default;
export interface IOpenaiProviderOptions {
openaiToken: string;
}
constructor(openaiToken: string) {
export class OpenAiProvider extends MultiModalModel {
private options: IOpenaiProviderOptions;
public openAiApiClient: plugins.openai.default;
public smartpdfInstance: plugins.smartpdf.SmartPdf;
constructor(optionsArg: IOpenaiProviderOptions) {
super();
this.openAiToken = openaiToken; // Ensure the token is stored
this.options = optionsArg;
}
async start() {
public async start() {
this.openAiApiClient = new plugins.openai.default({
apiKey: this.openAiToken,
apiKey: this.options.openaiToken,
dangerouslyAllowBrowser: true,
});
this.smartpdfInstance = new plugins.smartpdf.SmartPdf();
}
async stop() {}
public async stop() {}
chatStream(input: ReadableStream<string>): ReadableStream<string> {
const decoder = new TextDecoder();
let messageHistory: { role: 'assistant' | 'user'; content: string }[] = [];
public async chatStream(input: ReadableStream<string>): Promise<ReadableStream<string>> {
// TODO: implement for OpenAI
return new ReadableStream({
async start(controller) {
const reader = input.getReader();
try {
let done, value;
while ((({ done, value } = await reader.read()), !done)) {
const userMessage = decoder.decode(value, { stream: true });
messageHistory.push({ role: 'user', content: userMessage });
const aiResponse = await this.chat('', userMessage, messageHistory);
messageHistory.push({ role: 'assistant', content: aiResponse.message });
// Directly enqueue the string response instead of encoding it first
controller.enqueue(aiResponse.message);
}
controller.close();
} catch (err) {
controller.error(err);
}
},
});
const returnStream = new ReadableStream();
return returnStream;
}
// Implementing the synchronous chat interaction
public async chat(
systemMessage: string,
userMessage: string,
public async chat(optionsArg: {
systemMessage: string;
userMessage: string;
messageHistory: {
role: 'assistant' | 'user';
content: string;
}[]
) {
}[];
}) {
const result = await this.openAiApiClient.chat.completions.create({
model: 'gpt-4-turbo-preview',
messages: [
{ role: 'system', content: systemMessage },
...messageHistory,
{ role: 'user', content: userMessage },
{ role: 'system', content: optionsArg.systemMessage },
...optionsArg.messageHistory,
{ role: 'user', content: optionsArg.userMessage },
],
});
return {
@ -71,19 +57,77 @@ export class OpenAiProvider extends MultiModalModel {
};
}
public async audio(messageArg: string) {
const done = plugins.smartpromise.defer();
public async audio(optionsArg: { message: string }): Promise<NodeJS.ReadableStream> {
const done = plugins.smartpromise.defer<NodeJS.ReadableStream>();
const result = await this.openAiApiClient.audio.speech.create({
model: 'tts-1-hd',
input: messageArg,
input: optionsArg.message,
voice: 'nova',
response_format: 'mp3',
speed: 1,
});
const stream = result.body.pipe(plugins.smartfile.fsStream.createWriteStream(plugins.path.join(paths.nogitDir, 'output.mp3')));
stream.on('finish', () => {
done.resolve();
});
const stream = result.body;
done.resolve(stream);
return done.promise;
}
public async document(optionsArg: {
systemMessage: string;
userMessage: string;
pdfDocuments: Uint8Array[];
messageHistory: {
role: 'assistant' | 'user';
content: any;
}[];
}) {
let pdfDocumentImageBytesArray: Uint8Array[] = [];
for (const pdfDocument of optionsArg.pdfDocuments) {
const documentImageArray = await this.smartpdfInstance.convertPDFToPngBytes(pdfDocument);
pdfDocumentImageBytesArray = pdfDocumentImageBytesArray.concat(documentImageArray);
}
console.log(`image smartfile array`);
console.log(pdfDocumentImageBytesArray.map((smartfile) => smartfile.length));
const smartfileArray = await plugins.smartarray.map(
pdfDocumentImageBytesArray,
async (pdfDocumentImageBytes) => {
return plugins.smartfile.SmartFile.fromBuffer(
'pdfDocumentImage.jpg',
Buffer.from(pdfDocumentImageBytes)
);
}
);
const result = await this.openAiApiClient.chat.completions.create({
model: 'gpt-4-vision-preview',
// response_format: { type: "json_object" }, // not supported for now
messages: [
{ role: 'system', content: optionsArg.systemMessage },
...optionsArg.messageHistory,
{
role: 'user',
content: [
{ type: 'text', text: optionsArg.userMessage },
...(() => {
const returnArray = [];
for (const imageBytes of pdfDocumentImageBytesArray) {
returnArray.push({
type: 'image_url',
image_url: {
url: 'data:image/png;base64,' + Buffer.from(imageBytes).toString('base64'),
},
});
}
return returnArray;
})(),
],
},
],
});
return {
message: result.choices[0].message,
};
}
}

View File

@ -0,0 +1,3 @@
import * as plugins from './plugins.js';
export class PerplexityProvider {}