Spaces:

ABAO77
/

Run_code_api

Sleeping

App Files Files Community

ABAO77 committed on Sep 2

Commit

3fde6b6

1 Parent(s): 1ea1cfa

feat: add text cleaning functionality for TTS service to enhance input processing

Browse files

Files changed (3) hide show

src/agents/role_play/__pycache__/prompt.cpython-311.pyc +0 -0
src/services/tts_service.py +71 -2
test_tts_cleaning.py +151 -0

src/agents/role_play/__pycache__/prompt.cpython-311.pyc CHANGED Viewed

Binary files a/src/agents/role_play/__pycache__/prompt.cpython-311.pyc and b/src/agents/role_play/__pycache__/prompt.cpython-311.pyc differ

src/services/tts_service.py CHANGED Viewed

@@ -5,6 +5,7 @@ Text-to-Speech (TTS) Service using Deepgram API
 import requests
 import os
 import base64
 from src.utils.logger import logger
 from typing import Optional
@@ -20,6 +21,69 @@ class TTSService:
             logger.error("Deepgram API key not found in environment variables")
             raise ValueError("Deepgram API key is required")
     async def text_to_speech(
         self,
         text: str,
@@ -43,7 +107,12 @@ class TTSService:
                 return None
             # Clean and prepare text
-            cleaned_text = text.strip()
             if len(cleaned_text) > 2000:  # Limit text length for TTS
                 cleaned_text = cleaned_text[:2000] + "..."
                 logger.warning(f"Text truncated to 2000 characters for TTS")
@@ -57,7 +126,7 @@ class TTSService:
                 "Content-Type": "application/json"
             }
-            logger.info(f"Converting text to speech: {cleaned_text[:100]}...")
             # Make request to Deepgram API
             response = requests.post(

 import requests
 import os
 import base64
+import re
 from src.utils.logger import logger
 from typing import Optional
             logger.error("Deepgram API key not found in environment variables")
             raise ValueError("Deepgram API key is required")
+    def clean_text_for_speech(self, text: str) -> str:
+        """
+        Clean text for speech synthesis by removing problematic characters
+        Args:
+            text (str): The text to clean
+        Returns:
+            str: Cleaned text suitable for speech synthesis
+        """
+        if not text or not isinstance(text, str):
+            return ""
+        # Remove markdown formatting
+        text = re.sub(r'\*\*(.*?)\*\*', r'\1', text)  # Remove bold **text**
+        text = re.sub(r'\*(.*?)\*', r'\1', text)      # Remove italic *text*
+        text = re.sub(r'`(.*?)`', r'\1', text)        # Remove code `text`
+        text = re.sub(r'#{1,6}\s', '', text)          # Remove headers # ## ###
+        text = re.sub(r'\[(.*?)\]\(.*?\)', r'\1', text)  # Remove links [text](url) -> text
+        # Remove emojis and special unicode characters
+        # Emoticons
+        text = re.sub(r'[\U0001F600-\U0001F64F]', '', text)
+        # Misc symbols
+        text = re.sub(r'[\U0001F300-\U0001F5FF]', '', text)
+        # Transport & map
+        text = re.sub(r'[\U0001F680-\U0001F6FF]', '', text)
+        # Regional indicators
+        text = re.sub(r'[\U0001F1E0-\U0001F1FF]', '', text)
+        # Misc symbols
+        text = re.sub(r'[\U00002600-\U000026FF]', '', text)
+        # Dingbats
+        text = re.sub(r'[\U00002700-\U000027BF]', '', text)
+        # Variation selectors
+        text = re.sub(r'[\U0000FE00-\U0000FE0F]', '', text)
+        # Supplemental symbols
+        text = re.sub(r'[\U0001F900-\U0001F9FF]', '', text)
+        # Remove problematic punctuation and special characters
+        text = re.sub(r'[""'']', '"', text)    # Replace smart quotes with regular quotes
+        text = re.sub(r'[–—]', '-', text)      # Replace em/en dashes with hyphens
+        text = re.sub(r'[…]', '...', text)     # Replace ellipsis character
+        text = re.sub(r'[«»]', '"', text)      # Replace angle quotes
+        text = re.sub(r'[‹›]', "'", text)      # Replace single angle quotes
+        # Remove control characters and zero-width characters
+        text = re.sub(r'[\u200B-\u200D\uFEFF]', '', text)  # Zero-width chars
+        text = re.sub(r'[\u0000-\u001F\u007F-\u009F]', '', text)  # Control chars
+        # Clean up extra whitespace
+        text = re.sub(r'\s+', ' ', text)       # Multiple spaces to single space
+        text = text.strip()                    # Trim leading/trailing spaces
+        # Remove multiple consecutive punctuation
+        text = re.sub(r'\.{3,}', '...', text)  # Multiple dots to ellipsis
+        text = re.sub(r'!{2,}', '!', text)     # Multiple exclamations to single
+        text = re.sub(r'\?{2,}', '?', text)    # Multiple questions to single
+        # Ensure proper sentence endings
+        text = re.sub(r'([.!?])\s*([A-Z])', r'\1 \2', text)  # Space after sentence endings
+        return text
     async def text_to_speech(
         self,
         text: str,
                 return None
             # Clean and prepare text
+            cleaned_text = self.clean_text_for_speech(text)
+            if not cleaned_text or not cleaned_text.strip():
+                logger.warning("Text became empty after cleaning for TTS")
+                return None
             if len(cleaned_text) > 2000:  # Limit text length for TTS
                 cleaned_text = cleaned_text[:2000] + "..."
                 logger.warning(f"Text truncated to 2000 characters for TTS")
                 "Content-Type": "application/json"
             }
+            logger.info(f"Converting text to speech: '{cleaned_text[:100]}...' (original: '{text[:50]}...')")
             # Make request to Deepgram API
             response = requests.post(

test_tts_cleaning.py ADDED Viewed

	@@ -0,0 +1,151 @@

+#!/usr/bin/env python3
+"""
+Test script for TTS text cleaning functionality
+"""
+import sys
+import os
+# Add the parent directory to sys.path to import from src
+sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
+from src.services.tts_service import TTSService
def test_text_cleaning():
    """Exercise ``TTSService.clean_text_for_speech`` on representative inputs.

    Prints a per-case report (input, output, verdict). After every case has
    run, raises ``AssertionError`` naming each case marked ``expected_clean``
    whose output still contains emoji or markdown markers. An output that
    became empty is reported as a warning only.
    """
    print("🧪 Testing TTS Text Cleaning Function\n")

    # The cleaning method reads no instance state, so build the object without
    # running __init__ (which requires a Deepgram API key). This tests the
    # real implementation instead of a copy of it, and needs no dummy
    # environment variable or catch-all exception handler.
    tts = TTSService.__new__(TTSService)

    # Test cases
    test_cases = [
        {
            "name": "Simple text",
            "input": "Hello, how are you today?",
            "expected_clean": True
        },
        {
            "name": "Text with emojis",
            "input": "Great job! 🎉 You're doing amazing! 🌟 Keep it up! 💪",
            "expected_clean": True
        },
        {
            "name": "Markdown formatting",
            "input": "This is **bold** and this is *italic* and `code`",
            "expected_clean": True
        },
        {
            "name": "Complex markdown with links",
            "input": "Check out [this link](https://example.com) and ## Header text",
            "expected_clean": True
        },
        {
            "name": "Mixed content",
            "input": "🎯 **Practice Goal**: Learn English conversation skills! Visit [our website](https://wise.com) for more tips. 📚✨",
            "expected_clean": True
        },
        {
            "name": "Smart quotes and dashes",
            # Written with escapes so the case really contains typographic
            # characters regardless of how this file is copied or re-encoded.
            "input": "\u201cHello world\u201d and \u2018smart quotes\u2019 with em\u2014dash and en\u2013dash\u2026",
            "expected_clean": True
        },
        {
            "name": "Multiple punctuation",
            "input": "Wow!!! This is amazing??? Really......",
            "expected_clean": True
        },
        {
            "name": "Real AI response",
            "input": "🌟 **Excellent!** You did a great job with that conversation! Here are some tips:\n\n- Use *natural* expressions\n- Practice `daily`\n- Visit [practice site](https://example.com)\n\n💪 Keep practicing! 🎯",
            "expected_clean": True
        }
    ]

    # Inclusive code point ranges that must not survive cleaning.
    emoji_ranges = (
        (0x1F600, 0x1F64F),  # Emoticons
        (0x1F300, 0x1F5FF),  # Misc symbols
        (0x1F680, 0x1F6FF),  # Transport
        (0x2600, 0x26FF),    # Misc symbols
    )
    # A single '*' also covers the bold marker '**'.
    markdown_markers = ('*', '`', '#')

    failures = []

    print("Testing text cleaning function:\n")
    for i, test_case in enumerate(test_cases, 1):
        print(f"Test {i}: {test_case['name']}")
        print(f"Input:  '{test_case['input']}'")
        cleaned = tts.clean_text_for_speech(test_case['input'])
        print(f"Output: '{cleaned}'")

        # Check if cleaning was successful
        has_emojis = any(
            low <= ord(char) <= high
            for char in cleaned
            for low, high in emoji_ranges
        )
        has_markdown = any(marker in cleaned for marker in markdown_markers)

        problem = None
        if has_emojis:
            problem = "Still contains emojis"
            print("❌ Still contains emojis")
        elif has_markdown:
            problem = "Still contains markdown"
            print("❌ Still contains markdown")
        elif not cleaned.strip():
            print("⚠️  Text became empty after cleaning")
        else:
            print("✅ Cleaned successfully")

        if problem is not None and test_case["expected_clean"]:
            failures.append(f"{test_case['name']}: {problem}")

        print("-" * 50)
        print()

    # Fail only after the full report has been printed so one bad case does
    # not hide the results of the others.
    assert not failures, "Text cleaning failed for: " + "; ".join(failures)
+if __name__ == "__main__":
+    test_text_cleaning()