From bbd8770205ef910c618bf29ee028b17344201c5c Mon Sep 17 00:00:00 2001 From: Juergen Kunz Date: Wed, 8 Oct 2025 22:56:53 +0000 Subject: [PATCH] fix(provider.elevenlabs): Update ElevenLabs default TTS model to eleven_v3 and add local Claude permissions file --- changelog.md | 6 ++++++ readme.md | 8 ++++---- ts/00_commitinfo_data.ts | 2 +- ts/provider.elevenlabs.ts | 2 +- 4 files changed, 12 insertions(+), 6 deletions(-) diff --git a/changelog.md b/changelog.md index 4c8d242..bd9c01a 100644 --- a/changelog.md +++ b/changelog.md @@ -1,5 +1,11 @@ # Changelog +## 2025-10-08 - 0.7.5 - fix(provider.elevenlabs) +Update ElevenLabs default TTS model to eleven_v3 and add local Claude permissions file + +- Changed default ElevenLabs modelId from 'eleven_multilingual_v2' to 'eleven_v3' in ts/provider.elevenlabs.ts to use the newer/default TTS model. +- Added .claude/settings.local.json with a permissions allow-list for local Claude tooling and CI tasks. + ## 2025-10-03 - 0.7.4 - fix(provider.anthropic) Use image/png for embedded PDF images in Anthropic provider and add local Claude settings for development permissions diff --git a/readme.md b/readme.md index feaa091..7d8fd18 100644 --- a/readme.md +++ b/readme.md @@ -53,7 +53,7 @@ Choose the right provider for your use case: |----------|:----:|:---------:|:---:|:------:|:---------:|:--------:|:------:|------------| | **OpenAI** | ✅ | ✅ | ✅ | ✅ | ✅ | ✅ | ✅ | • gpt-image-1
• DALL-E 3
• Deep research API | | **Anthropic** | ✅ | ✅ | ❌ | ✅ | ✅ | ✅ | ❌ | • Claude Sonnet 4.5
• Superior reasoning
• Web search API | -| **ElevenLabs** | ❌ | ❌ | ✅ | ❌ | ❌ | ❌ | ❌ | • Premium TTS
• 32 languages
• Natural voices | +| **ElevenLabs** | ❌ | ❌ | ✅ | ❌ | ❌ | ❌ | ❌ | • Premium TTS
• 70+ languages
• Natural voices | | **Ollama** | ✅ | ✅ | ❌ | ✅ | ✅ | ❌ | ❌ | • 100% local
• Privacy-first
• No API costs | | **XAI** | ✅ | ✅ | ❌ | ❌ | ✅ | ❌ | ❌ | • Grok models
• Real-time data
• Uncensored | | **Perplexity** | ✅ | ✅ | ❌ | ❌ | ❌ | ✅ | ❌ | • Web-aware
• Research-focused
• Sonar Pro models | @@ -118,11 +118,11 @@ const audioStream = await ai.openaiProvider.audio({ message: 'Welcome to the future of AI development!' }); -// ElevenLabs TTS - Premium quality, natural voices +// ElevenLabs TTS - Premium quality, natural voices (uses v3 by default) const elevenLabsAudio = await ai.elevenlabsProvider.audio({ message: 'Experience the most lifelike text to speech technology.', voiceId: '19STyYD15bswVz51nqLf', // Optional: Samara voice - modelId: 'eleven_multilingual_v2', // Optional: defaults to eleven_multilingual_v2 + modelId: 'eleven_v3', // Optional: defaults to eleven_v3 (70+ languages, most expressive) voiceSettings: { // Optional: fine-tune voice characteristics stability: 0.5, // 0-1: Speech consistency similarity_boost: 0.8, // 0-1: Voice similarity to original @@ -594,7 +594,7 @@ export ELEVENLABS_API_KEY=sk-... | **Complex Reasoning** | Anthropic | Superior logical thinking, safer outputs | | **Research & Facts** | Perplexity | Web-aware, provides citations | | **Deep Research** | OpenAI | Deep Research API with comprehensive analysis | -| **Premium TTS** | ElevenLabs | Most natural voices, 32 languages, superior quality | +| **Premium TTS** | ElevenLabs | Most natural voices, 70+ languages, superior quality (v3) | | **Speed Critical** | Groq | 10x faster inference, sub-second responses | | **Privacy Critical** | Ollama | 100% local, no data leaves your servers | | **Real-time Data** | XAI | Access to current information | diff --git a/ts/00_commitinfo_data.ts b/ts/00_commitinfo_data.ts index ed11e3e..561cd88 100644 --- a/ts/00_commitinfo_data.ts +++ b/ts/00_commitinfo_data.ts @@ -3,6 +3,6 @@ */ export const commitinfo = { name: '@push.rocks/smartai', - version: '0.7.4', + version: '0.7.5', description: 'SmartAi is a versatile TypeScript library designed to facilitate integration and interaction with various AI models, offering functionalities for chat, audio generation, document processing, and vision tasks.' } diff --git a/ts/provider.elevenlabs.ts b/ts/provider.elevenlabs.ts index 50a3019..e689936 100644 --- a/ts/provider.elevenlabs.ts +++ b/ts/provider.elevenlabs.ts @@ -61,7 +61,7 @@ export class ElevenLabsProvider extends MultiModalModel { throw new Error('Voice ID is required for ElevenLabs TTS. Please provide voiceId in the method call or set defaultVoiceId in provider options.'); } - const modelId = optionsArg.modelId || this.options.defaultModelId || 'eleven_multilingual_v2'; + const modelId = optionsArg.modelId || this.options.defaultModelId || 'eleven_v3'; const url = `${this.baseUrl}/text-to-speech/${voiceId}`;