Spaces:

HumeAI
/

expressive-tts-arena

Running

zach committed on Feb 6

Commit

7f69677

1 Parent(s): 557e7ca

Update design to accommodate easily adding other TTS providers in the future

Files changed (2) hide show

src/app.py CHANGED Viewed

@@ -28,6 +28,7 @@ from src.constants import (
     PROMPT_MIN_LENGTH,
     SAMPLE_PROMPTS,
     TROPHY_EMOJI,
     VOTE_FOR_OPTION_A,
     VOTE_FOR_OPTION_B,
 )
@@ -108,24 +109,28 @@ def text_to_speech(
         logger.warning("Skipping text-to-speech due to empty text.")
         raise gr.Error("Please generate or enter text to synthesize.")
     # If not using generated text, then only compare Hume to Hume
-    compare_hume_with_elevenlabs = (text == generated_text_state) and (
-        random.random() < 0.5
     )
     try:
         with ThreadPoolExecutor(max_workers=2) as executor:
-            provider_a = HUME_AI
             future_audio_a = executor.submit(text_to_speech_with_hume, prompt, text)
-            if compare_hume_with_elevenlabs:
-                provider_b = ELEVENLABS
-                future_audio_b = executor.submit(
-                    text_to_speech_with_elevenlabs, prompt, text
-                )
-            else:
-                provider_b = HUME_AI
-                future_audio_b = executor.submit(text_to_speech_with_hume, prompt, text)
             audio_a = future_audio_a.result()
             audio_b = future_audio_b.result()

     PROMPT_MIN_LENGTH,
     SAMPLE_PROMPTS,
     TROPHY_EMOJI,
+    TTS_PROVIDERS,
     VOTE_FOR_OPTION_A,
     VOTE_FOR_OPTION_B,
 )
         logger.warning("Skipping text-to-speech due to empty text.")
         raise gr.Error("Please generate or enter text to synthesize.")
+    # Hume AI always included in comparison
+    provider_a = HUME_AI
     # If not using generated text, then only compare Hume to Hume
+    provider_b = (
+        HUME_AI if text != generated_text_state else random.choice(TTS_PROVIDERS)
     )
     try:
         with ThreadPoolExecutor(max_workers=2) as executor:
             future_audio_a = executor.submit(text_to_speech_with_hume, prompt, text)
+            match provider_b:
+                case ELEVENLABS:
+                    future_audio_b = executor.submit(
+                        text_to_speech_with_elevenlabs, prompt, text
+                    )
+                case HUME_AI:
+                    future_audio_b = executor.submit(
+                        text_to_speech_with_hume, prompt, text
+                    )
+                case _:
+                    raise ValueError(f"Unsupported provider: {provider_b}")
             audio_a = future_audio_a.result()
             audio_b = future_audio_b.result()

src/constants.py CHANGED Viewed

@@ -4,6 +4,9 @@ constants.py
 This module defines global constants used throughout the project.
 """
 # Third-Party Library Imports
 from src.types import OptionKey, TTSProviderName
@@ -11,6 +14,7 @@ from src.types import OptionKey, TTSProviderName
 # UI constants
 HUME_AI: TTSProviderName = "Hume AI"
 ELEVENLABS: TTSProviderName = "ElevenLabs"
 PROMPT_MIN_LENGTH: int = 20
 PROMPT_MAX_LENGTH: int = 800

 This module defines global constants used throughout the project.
 """
+# Standard Library Imports
+from typing import List
 # Third-Party Library Imports
 from src.types import OptionKey, TTSProviderName
 # UI constants
 HUME_AI: TTSProviderName = "Hume AI"
 ELEVENLABS: TTSProviderName = "ElevenLabs"
+TTS_PROVIDERS: List[TTSProviderName]
 PROMPT_MIN_LENGTH: int = 20
 PROMPT_MAX_LENGTH: int = 800