From 746caea83fa8028061ea93486ab8c9e4bf873bce Mon Sep 17 00:00:00 2001 From: Kaustubh Maske Patil <37668193+nikochiko@users.noreply.github.com> Date: Mon, 20 Nov 2023 14:50:14 +0530 Subject: [PATCH] 11labs: Add turbo model and extra language **Changes:** * Add eleven turbo model for extremely low-latency English TTS * Add 29th supported language for multilingual v2 model * Remove trailing space in text_to_speech_widget file --- .../text_to_speech_settings_widgets.py | 35 ++++++++++--------- 1 file changed, 18 insertions(+), 17 deletions(-) diff --git a/daras_ai_v2/text_to_speech_settings_widgets.py b/daras_ai_v2/text_to_speech_settings_widgets.py index 110edc279..0526c441f 100644 --- a/daras_ai_v2/text_to_speech_settings_widgets.py +++ b/daras_ai_v2/text_to_speech_settings_widgets.py @@ -76,42 +76,43 @@ class TextToSpeechProviders(Enum): # Mapping from Model ID -> Title in UI ELEVEN_LABS_MODELS = { - "eleven_multilingual_v2": "Multilingual V2", - "eleven_monolingual_v1": "English V1 - Low latency English TTS", + "eleven_multilingual_v2": "Multilingual V2 - High quality speech in 29 languages", + "eleven_turbo_v2": "English V2 - Very low latency text-to-speech", + "eleven_monolingual_v1": "English V1 - Low latency text-to-speech", } ELEVEN_LABS_SUPPORTED_LANGS = [ "English", + "Japanese", "Chinese", - "Spanish", + "German", "Hindi", - "Portuguese", "French", - "German", - "Japanese", - "Arabic", "Korean", - "Indonesian", + "Portuguese", "Italian", + "Spanish", + "Indonesian", "Dutch", "Turkish", + "Filipino", "Polish", "Swedish", - "Filipino", - "Malay", + "Bulgarian", "Romanian", - "Ukrainian", - "Greek", + "Arabic", "Czech", - "Danish", + "Greek", "Finnish", - "Bulgarian", "Croatian", + "Malay", "Slovak", + "Danish", "Tamil", + "Ukrainian", + "Russian", ] - BARK_SUPPORTED_LANGS = [ ("English", "en"), ("German", "de"), @@ -184,7 +185,7 @@ def text_to_speech_settings(page): with col1: st.slider( """ - ###### Speaking rate + ###### Speaking rate *`1.0` is the normal native speed of the speaker* """, min_value=0.3, @@ -219,7 +220,7 @@ def text_to_speech_settings(page): with col1: st.slider( """ - ###### Speaking rate + ###### Speaking rate *`1.0` is the normal native speed of the speaker* """, min_value=0.5,