elevenlabs tts: support speed and pronunciation_dictionary_locators (#1137)

2025-12-20 08:40:38 +00:00 · 2025-04-09 23:32:06 +07:00
parent c708b7d007
commit 77f0fc85a3
1 changed files with 9 additions and 2 deletions
--- a/lib/tasks/tts-task.js
+++ b/lib/tasks/tts-task.js
@@ -65,7 +65,6 @@ class TtsTask extends Task {

  async setTtsStreamingChannelVars(vendor, language, voice, credentials, ep) {
    const {api_key, model_id, custom_tts_streaming_url, auth_token} = credentials;
-    const {stability, similarity_boost, use_speaker_boost, style} = this.options;
    let obj;

    this.logger.debug({credentials},
@@ -87,6 +86,7 @@ class TtsTask extends Task {
        };
        break;
      case 'elevenlabs':
+        const {stability, similarity_boost, use_speaker_boost, style, speed} = this.options.voice_settings || {};
        obj = {
          ELEVENLABS_API_KEY: api_key,
          ELEVENLABS_TTS_STREAMING_MODEL_ID: model_id,
@@ -96,7 +96,14 @@ class TtsTask extends Task {
          ...(stability && {ELEVENLABS_TTS_STREAMING_VOICE_SETTINGS_STABILITY: stability}),
          ...(similarity_boost && {ELEVENLABS_TTS_STREAMING_VOICE_SETTINGS_SIMILARITY_BOOST: similarity_boost}),
          ...(use_speaker_boost && {ELEVENLABS_TTS_STREAMING_VOICE_SETTINGS_USE_SPEAKER_BOOST: use_speaker_boost}),
-          ...(style && {ELEVENLABS_TTS_STREAMING_VOICE_SETTINGS_STYLE: style})
+          ...(style && {ELEVENLABS_TTS_STREAMING_VOICE_SETTINGS_STYLE: style}),
+          // speed ranges from 0.7 to 1.2 (default 1.0); check null/undefined explicitly so 0 is still sent
+          ...(speed !== null && speed !== undefined && {ELEVENLABS_TTS_STREAMING_VOICE_SETTINGS_SPEED: `${speed}`}),
+          ...(this.options.pronunciation_dictionary_locators &&
+            Array.isArray(this.options.pronunciation_dictionary_locators) && {
+            ELEVENLABS_TTS_STREAMING_PRONUNCIATION_DICTIONARY_LOCATORS:
+            JSON.stringify(this.options.pronunciation_dictionary_locators)
+          }),
        };
        break;
      case 'rimelabs':