Spaces:

LocaleNLP
/

LocaleNLP_Translator

Runtime error

App Files Files Community

Mgolo commited on Sep 17

Commit

1aee8e8

verified ·

1 Parent(s): 8c3c59b

Update app.py

Browse files

Files changed (1) hide show

app.py +536 -225

app.py CHANGED Viewed

@@ -1,9 +1,22 @@
 import os
 import re
-import tempfile
 import logging
-from typing import Optional, Dict, Tuple, Any
 from pathlib import Path
 import gradio as gr
 import torch
@@ -11,256 +24,554 @@ import whisper
 import fitz  # PyMuPDF
 import docx
 from bs4 import BeautifulSoup
-import markdown2
 import chardet
 from transformers import pipeline, MarianTokenizer, AutoModelForSeq2SeqLM
-# -------------------------------
-# Configuration & Logging Setup
-# -------------------------------
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-HF_TOKEN = os.getenv("hffff")
-# Language Pair Models
-MODELS: Dict[Tuple[str, str], Dict[str, str]] = {
-    ("English", "Wolof"): {"model_name": "LocaleNLP/localenlp-eng-wol-0.03", "tag": ">>wol<<"},
-    ("Wolof", "English"): {"model_name": "LocaleNLP/localenlp-wol-eng-0.03", "tag": ">>eng<<"},
-    ("English", "Hausa"): {"model_name": "LocaleNLP/localenlp-eng-hau-0.01", "tag": ">>hau<<"},
-    ("Hausa", "English"): {"model_name": "LocaleNLP/localenlp-hau-eng-0.01", "tag": ">>eng<<"},
-    ("English", "Darija"): {"model_name": "LocaleNLP/english_darija", "tag": ">>dar<<"}
-}
-SUPPORTED_LANGUAGES = ["English", "Wolof", "Hausa", "Darija"]
-INPUT_MODES = ["Text", "Audio", "File"]
-SUPPORTED_FILE_TYPES = [".pdf", ".docx", ".html", ".htm", ".md", ".srt", ".txt"]
-# -------------------------------
-# Model Manager
-# -------------------------------
 class ModelManager:
-    """Manages loading and caching of translation and transcription models."""
     def __init__(self):
-        self.translation_pipeline = None
-        self.whisper_model = None
-    def load_translation_model(self, src_lang: str, tgt_lang: str) -> Tuple[Any, str]:
-        key = (src_lang, tgt_lang)
-        if key not in MODELS:
-            raise ValueError(f"Unsupported language pair: {src_lang} -> {tgt_lang}")
-        config = MODELS[key]
-        model_name = config["model_name"]
-        lang_tag = config["tag"]
-        if self.translation_pipeline is None or self.translation_pipeline.model.config._name_or_path != model_name:
-            logger.info(f"Loading translation model: {model_name}")
-            model = AutoModelForSeq2SeqLM.from_pretrained(model_name, token=HF_TOKEN).to(DEVICE)
-            tokenizer = MarianTokenizer.from_pretrained(model_name, token=HF_TOKEN)
-            self.translation_pipeline = pipeline(
                 "translation",
                 model=model,
                 tokenizer=tokenizer,
-                device=0 if DEVICE.type == "cuda" else -1
             )
-        return self.translation_pipeline, lang_tag
-    def load_whisper_model(self) -> Any:
-        if self.whisper_model is None:
             logger.info("Loading Whisper base model...")
-            self.whisper_model = whisper.load_model("base")
-        return self.whisper_model
-# -------------------------------
-# File Processing Utilities
-# -------------------------------
-def extract_text_from_file(file_path: str) -> str:
-    """Extracts text from various file types."""
-    ext = Path(file_path).suffix.lower()
-    content = Path(file_path).read_bytes()
-    if ext == ".pdf":
         with fitz.open(stream=content, filetype="pdf") as doc:
             return "\n".join(page.get_text() for page in doc)
-    elif ext == ".docx":
-        doc = docx.Document(file_path)
-        return "\n".join(p.text for p in doc.paragraphs)
-    elif ext in (".html", ".htm"):
-        return BeautifulSoup(content.decode("utf-8", errors="ignore"), "html.parser").get_text()
-    elif ext == ".md":
-        html = markdown2.markdown(content.decode("utf-8", errors="ignore"))
-        return BeautifulSoup(html, "html.parser").get_text()
-    elif ext == ".srt":
-        decoded = content.decode("utf-8", errors="ignore")
-        return re.sub(r"\d+\n\d{2}:\d{2}:\d{2},\d{3} --> .*?\n", "", decoded)
-    elif ext in (".txt", ".text"):
-        encoding = chardet.detect(content)["encoding"]
-        return content.decode(encoding or "utf-8", errors="ignore")
-    else:
-        raise ValueError(f"Unsupported file type: {ext}")
-# -------------------------------
-# Translation Logic
-# -------------------------------
-def translate_text(text: str, src_lang: str, tgt_lang: str, model_manager: ModelManager) -> str:
-    """Translates input text using the specified language pair."""
-    pipe, tag = model_manager.load_translation_model(src_lang, tgt_lang)
-    paragraphs = text.splitlines()
-    translated_output = []
-    with torch.no_grad():
-        for para in paragraphs:
-            if not para.strip():
-                translated_output.append("")
-                continue
-            sentences = [s.strip() for s in para.split(". ") if s.strip()]
-            formatted = [f"{tag} {sentence}" for sentence in sentences]
-            results = pipe(
-                formatted,
-                max_length=5000,
-                num_beams=5,
-                early_stopping=True,
-                no_repeat_ngram_size=3,
-                repetition_penalty=1.5,
-                length_penalty=1.2
             )
-            translated_sentences = [r["translation_text"].capitalize() for r in results]
-            translated_output.append(". ".join(translated_sentences))
-    return "\n".join(translated_output)
-# -------------------------------
-# Audio Transcription
-# -------------------------------
-def transcribe_audio(file_path: str, model_manager: ModelManager) -> str:
-    """Transcribes audio file using Whisper."""
-    model = model_manager.load_whisper_model()
-    result = model.transcribe(file_path)
-    return result["text"]
-# -------------------------------
-# Main Processing Function
-# -------------------------------
-def process_input(
-    mode: str,
-    src_lang: str,
-    text_input: str,
-    audio_path: Optional[str],
-    file_obj: Optional[gr.FileData]
-) -> str:
-    """Processes input based on selected mode."""
-    if mode == "Text":
-        return text_input
-    elif mode == "Audio":
-        if src_lang != "English":
-            raise ValueError("Audio input must be in English.")
-        if not audio_path:
-            raise ValueError("No audio file uploaded.")
-        return transcribe_audio(audio_path, model_manager)
-    elif mode == "File":
-        if not file_obj:
-            raise ValueError("No file uploaded.")
-        return extract_text_from_file(file_obj.name)
-    return ""
-# -------------------------------
-# Gradio UI Logic
-# -------------------------------
-model_manager = ModelManager()
-def update_visibility(mode: str) -> Dict[str, Any]:
-    """Update visibility of input components based on selected mode."""
-    return {
-        input_text: gr.update(visible=(mode == "Text")),
-        audio_input: gr.update(visible=(mode == "Audio")),
-        file_input: gr.update(visible=(mode == "File")),
-        extracted_text: gr.update(value="", visible=True),
-        output_text: gr.update(value="")
-    }
-def handle_process(
-    mode: str,
-    src_lang: str,
-    text_input: str,
-    audio_path: Optional[str],
-    file_obj: Optional[gr.FileData]
-) -> Tuple[str, str]:
-    """Handles the initial processing of input."""
-    try:
-        extracted = process_input(mode, src_lang, text_input, audio_path, file_obj)
-        return extracted, ""
-    except Exception as e:
-        logger.error(f"Processing error: {e}")
-        return "", f"Error: {str(e)}"
-def handle_translate(extracted_text: str, src_lang: str, tgt_lang: str) -> str:
-    """Handles translation of extracted text."""
-    if not extracted_text.strip():
-        return "No input text to translate."
     try:
-        return translate_text(extracted_text, src_lang, tgt_lang, model_manager)
     except Exception as e:
-        logger.error(f"Translation error: {e}")
-        return f"Translation error: {str(e)}"
-# -------------------------------
-# Gradio Interface
-# -------------------------------
-with gr.Blocks(title="LocaleNLP Translator") as demo:
-    gr.Markdown("## 🌍 LocaleNLP Multi-language Translator")
-    gr.Markdown("Supports translation between English, Wolof, Hausa, and Darija. Audio input must be in English.")
-    with gr.Row():
-        input_mode = gr.Radio(choices=INPUT_MODES, label="Input Type", value="Text")
-        input_lang = gr.Dropdown(choices=SUPPORTED_LANGUAGES[:-1], label="Input Language", value="English")
-        output_lang = gr.Dropdown(choices=SUPPORTED_LANGUAGES, label="Output Language", value="Wolof")
-    input_text = gr.Textbox(label="Enter Text", lines=10, visible=True)
-    audio_input = gr.Audio(label="Upload Audio (.wav, .mp3, .m4a)", type="filepath", visible=False)
-    file_input = gr.File(file_types=SUPPORTED_FILE_TYPES, label="Upload Document", visible=False)
-    extracted_text = gr.Textbox(label="Extracted / Transcribed Text", lines=10, interactive=False)
-    translate_button = gr.Button("Translate")
-    output_text = gr.Textbox(label="Translated Text", lines=10, interactive=False)
-    input_mode.change(fn=update_visibility, inputs=input_mode, outputs=[input_text, audio_input, file_input, extracted_text, output_text])
-    translate_button.click(
-        fn=handle_process,
-        inputs=[input_mode, input_lang, input_text, audio_input, file_input],
-        outputs=[extracted_text, output_text]
-    ).then(
-        fn=handle_translate,
-        inputs=[extracted_text, input_lang, output_lang],
-        outputs=output_text
-    )
 if __name__ == "__main__":
-    demo.launch()

+"""
+LocaleNLP Translation Service
+============================
+A multi-language translation application supporting English, Wolof, Hausa, and Darija.
+Features text, audio, and document translation with a modern web interface.
+Author: LocaleNLP Team
+Version: 1.0.0
+"""
 import os
 import re
 import logging
+import tempfile
+from typing import Optional, Dict, Tuple, Any, Union
 from pathlib import Path
+from dataclasses import dataclass
+from enum import Enum
 import gradio as gr
 import torch
 import fitz  # PyMuPDF
 import docx
 from bs4 import BeautifulSoup
+from markdown import markdown
 import chardet
 from transformers import pipeline, MarianTokenizer, AutoModelForSeq2SeqLM
+from huggingface_hub import login
+# ================================
+# Configuration & Constants
+# ================================
+class Language(str, Enum):
+    """Supported languages for translation."""
+    ENGLISH = "English"
+    WOLOF = "Wolof"
+    HAUSA = "Hausa"
+    DARIJA = "Darija"
+class InputMode(str, Enum):
+    """Supported input modes."""
+    TEXT = "Text"
+    AUDIO = "Audio"
+    FILE = "File"
+@dataclass
+class ModelConfig:
+    """Configuration for translation models."""
+    model_name: str
+    language_tag: str
+# Language pair configurations
+TRANSLATION_MODELS: Dict[Tuple[Language, Language], ModelConfig] = {
+    (Language.ENGLISH, Language.WOLOF): ModelConfig(
+        "LocaleNLP/localenlp-eng-wol-0.03", ">>wol<<"
+    ),
+    (Language.WOLOF, Language.ENGLISH): ModelConfig(
+        "LocaleNLP/localenlp-wol-eng-0.03", ">>eng<<"
+    ),
+    (Language.ENGLISH, Language.HAUSA): ModelConfig(
+        "LocaleNLP/localenlp-eng-hau-0.01", ">>hau<<"
+    ),
+    (Language.HAUSA, Language.ENGLISH): ModelConfig(
+        "LocaleNLP/localenlp-hau-eng-0.01", ">>eng<<"
+    ),
+    (Language.ENGLISH, Language.DARIJA): ModelConfig(
+        "LocaleNLP/english_darija", ">>dar<<"
+    )
+}
+# File type support
+SUPPORTED_FILE_TYPES = [
+    ".pdf", ".docx", ".html", ".htm", ".md",
+    ".srt", ".txt", ".text"
+]
+# Audio file extensions
+AUDIO_EXTENSIONS = [".wav", ".mp3", ".m4a"]
+# ================================
+# Logging Configuration
+# ================================
+logging.basicConfig(
+    level=logging.INFO,
+    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
+)
+logger = logging.getLogger(__name__)
+# ================================
+# Model Management
+# ================================
 class ModelManager:
+    """Centralized model management for translation and transcription."""
     def __init__(self):
+        self._translation_pipeline = None
+        self._whisper_model = None
+        self._current_model_name = None
+    def get_translation_pipeline(
+        self,
+        source_lang: Language,
+        target_lang: Language
+    ) -> Tuple[Any, str]:
+        """
+        Load and return translation pipeline for given language pair.
+        Args:
+            source_lang: Source language
+            target_lang: Target language
+        Returns:
+            Tuple of (pipeline, language_tag)
+        Raises:
+            ValueError: If language pair is not supported
+        """
+        key = (source_lang, target_lang)
+        if key not in TRANSLATION_MODELS:
+            raise ValueError(f"Unsupported translation pair: {source_lang} -> {target_lang}")
+        config = TRANSLATION_MODELS[key]
+        # Load model if not loaded or different model needed
+        if (self._translation_pipeline is None or
+            self._current_model_name != config.model_name):
+            logger.info(f"Loading translation model: {config.model_name}")
+            # Authenticate with Hugging Face if token provided
+            if hf_token := os.getenv("hffff"):
+                login(token=hf_token)
+            model = AutoModelForSeq2SeqLM.from_pretrained(
+                config.model_name,
+                token=hf_token
+            ).to(self._get_device())
+            tokenizer = MarianTokenizer.from_pretrained(
+                config.model_name,
+                token=hf_token
+            )
+            self._translation_pipeline = pipeline(
                 "translation",
                 model=model,
                 tokenizer=tokenizer,
+                device=0 if self._get_device().type == "cuda" else -1
             )
+            self._current_model_name = config.model_name
+        return self._translation_pipeline, config.language_tag
+    def get_whisper_model(self) -> Any:
+        """
+        Load and return Whisper transcription model.
+        Returns:
+            Whisper model instance
+        """
+        if self._whisper_model is None:
             logger.info("Loading Whisper base model...")
+            self._whisper_model = whisper.load_model("base")
+        return self._whisper_model
+    def _get_device(self) -> torch.device:
+        """Get appropriate device for model execution."""
+        return torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# ================================
+# Content Processing
+# ================================
+class ContentProcessor:
+    """Handles extraction and processing of content from various sources."""
+    @staticmethod
+    def extract_text_from_file(file_path: Union[str, Path]) -> str:
+        """
+        Extract text content from various file formats.
+        Args:
+            file_path: Path to the file
+        Returns:
+            Extracted text content
+        Raises:
+            ValueError: If file type is unsupported
+            Exception: If file processing fails
+        """
+        file_path = Path(file_path)
+        extension = file_path.suffix.lower()
+        try:
+            content = file_path.read_bytes()
+            if extension == ".pdf":
+                return ContentProcessor._extract_pdf_text(content)
+            elif extension == ".docx":
+                return ContentProcessor._extract_docx_text(file_path)
+            elif extension in (".html", ".htm"):
+                return ContentProcessor._extract_html_text(content)
+            elif extension == ".md":
+                return ContentProcessor._extract_markdown_text(content)
+            elif extension == ".srt":
+                return ContentProcessor._extract_srt_text(content)
+            elif extension in (".txt", ".text"):
+                return ContentProcessor._extract_plain_text(content)
+            else:
+                raise ValueError(f"Unsupported file type: {extension}")
+        except Exception as e:
+            logger.error(f"Failed to extract text from {file_path}: {e}")
+            raise
+    @staticmethod
+    def _extract_pdf_text(content: bytes) -> str:
+        """Extract text from PDF file."""
         with fitz.open(stream=content, filetype="pdf") as doc:
             return "\n".join(page.get_text() for page in doc)
+    @staticmethod
+    def _extract_docx_text(file_path: Path) -> str:
+        """Extract text from DOCX file."""
+        doc = docx.Document(str(file_path))
+        return "\n".join(paragraph.text for paragraph in doc.paragraphs)
+    @staticmethod
+    def _extract_html_text(content: bytes) -> str:
+        """Extract text from HTML file."""
+        encoding = chardet.detect(content)["encoding"] or "utf-8"
+        text = content.decode(encoding, errors="ignore")
+        soup = BeautifulSoup(text, "html.parser")
+        return soup.get_text()
+    @staticmethod
+    def _extract_markdown_text(content: bytes) -> str:
+        """Extract text from Markdown file."""
+        encoding = chardet.detect(content)["encoding"] or "utf-8"
+        text = content.decode(encoding, errors="ignore")
+        html = markdown(text)
+        soup = BeautifulSoup(html, "html.parser")
+        return soup.get_text()
+    @staticmethod
+    def _extract_srt_text(content: bytes) -> str:
+        """Extract text from SRT subtitle file."""
+        encoding = chardet.detect(content)["encoding"] or "utf-8"
+        text = content.decode(encoding, errors="ignore")
+        # Remove timestamp lines
+        return re.sub(r"\d+\n\d{2}:\d{2}:\d{2},\d{3} --> .*?\n", "", text)
+    @staticmethod
+    def _extract_plain_text(content: bytes) -> str:
+        """Extract text from plain text file."""
+        encoding = chardet.detect(content)["encoding"] or "utf-8"
+        return content.decode(encoding, errors="ignore")
+# ================================
+# Translation Service
+# ================================
+class TranslationService:
+    """Core translation service with advanced processing capabilities."""
+    def __init__(self, model_manager: ModelManager):
+        self.model_manager = model_manager
+    def translate(
+        self,
+        text: str,
+        source_lang: Language,
+        target_lang: Language
+    ) -> str:
+        """
+        Translate text from source to target language.
+        Args:
+            text: Input text to translate
+            source_lang: Source language
+            target_lang: Target language
+        Returns:
+            Translated text
+        """
+        if not text.strip():
+            return "No input text to translate."
+        pipeline_obj, lang_tag = self.model_manager.get_translation_pipeline(
+            source_lang, target_lang
+        )
+        # Process text in paragraphs
+        paragraphs = text.splitlines()
+        translated_paragraphs = []
+        with torch.no_grad():
+            for paragraph in paragraphs:
+                if not paragraph.strip():
+                    translated_paragraphs.append("")
+                    continue
+                # Split into sentences and translate
+                sentences = [
+                    s.strip() for s in paragraph.split(". ")
+                    if s.strip()
+                ]
+                # Add language tag to each sentence
+                formatted_sentences = [
+                    f"{lang_tag} {sentence}"
+                    for sentence in sentences
+                ]
+                # Perform translation
+                results = pipeline_obj(
+                    formatted_sentences,
+                    max_length=5000,
+                    num_beams=5,
+                    early_stopping=True,
+                    no_repeat_ngram_size=3,
+                    repetition_penalty=1.5,
+                    length_penalty=1.2
+                )
+                # Process results
+                translated_sentences = [
+                    result["translation_text"].capitalize()
+                    for result in results
+                ]
+                translated_paragraphs.append(". ".join(translated_sentences))
+        return "\n".join(translated_paragraphs)
+# ================================
+# Audio Processing
+# ================================
+class AudioProcessor:
+    """Handles audio file transcription using Whisper."""
+    def __init__(self, model_manager: ModelManager):
+        self.model_manager = model_manager
+    def transcribe(self, audio_file_path: str) -> str:
+        """
+        Transcribe audio file to text.
+        Args:
+            audio_file_path: Path to audio file
+        Returns:
+            Transcribed text
+        """
+        model = self.model_manager.get_whisper_model()
+        result = model.transcribe(audio_file_path)
+        return result["text"]
+# ================================
+# Main Application
+# ================================
+class TranslationApp:
+    """Main application orchestrating all components."""
+    def __init__(self):
+        self.model_manager = ModelManager()
+        self.content_processor = ContentProcessor()
+        self.translation_service = TranslationService(self.model_manager)
+        self.audio_processor = AudioProcessor(self.model_manager)
+    def process_input(
+        self,
+        mode: InputMode,
+        source_lang: Language,
+        text_input: str,
+        audio_file: Optional[str],
+        file_obj: Optional[gr.FileData]
+    ) -> str:
+        """
+        Process input based on selected mode.
+        Args:
+            mode: Input mode
+            source_lang: Source language
+            text_input: Text input
+            audio_file: Audio file path
+            file_obj: Uploaded file object
+        Returns:
+            Processed text content
+        """
+        if mode == InputMode.TEXT:
+            return text_input
+        elif mode == InputMode.AUDIO:
+            if source_lang != Language.ENGLISH:
+                raise ValueError("Audio input must be in English.")
+            if not audio_file:
+                raise ValueError("No audio file provided.")
+            return self.audio_processor.transcribe(audio_file)
+        elif mode == InputMode.FILE:
+            if not file_obj:
+                raise ValueError("No file uploaded.")
+            return self.content_processor.extract_text_from_file(file_obj.name)
+        return ""
+    def create_interface(self) -> gr.Blocks:
+        """Create and return the Gradio interface."""
+        with gr.Blocks(
+            title="LocaleNLP Translation Service",
+            theme=gr.themes.Soft()
+        ) as interface:
+            # Header
+            gr.Markdown("""
+            # 🌍 LocaleNLP Translation Service
+            Translate between English, Wolof, Hausa, and Darija with support for text, audio, and documents.
+            """)
+            # Input controls
+            with gr.Row():
+                input_mode = gr.Radio(
+                    choices=[mode.value for mode in InputMode],
+                    label="Input Type",
+                    value=InputMode.TEXT.value
+                )
+                input_lang = gr.Dropdown(
+                    choices=[lang.value for lang in Language if lang != Language.DARIJA],
+                    label="Input Language",
+                    value=Language.ENGLISH.value
+                )
+                output_lang = gr.Dropdown(
+                    choices=[lang.value for lang in Language],
+                    label="Output Language",
+                    value=Language.WOLOF.value
+                )
+            # Input components
+            input_text = gr.Textbox(
+                label="Enter Text",
+                lines=8,
+                visible=True,
+                placeholder="Type or paste your text here..."
             )
+            audio_input = gr.Audio(
+                label="Upload Audio",
+                type="filepath",
+                visible=False
+            )
+            file_input = gr.File(
+                file_types=SUPPORTED_FILE_TYPES,
+                label="Upload Document",
+                visible=False
+            )
+            # Processing area
+            extracted_text = gr.Textbox(
+                label="Extracted / Transcribed Text",
+                lines=8,
+                interactive=False
+            )
+            translate_btn = gr.Button(
+                "🔄 Process & Translate",
+                variant="primary"
+            )
+            output_text = gr.Textbox(
+                label="Translated Text",
+                lines=8,
+                interactive=False
+            )
+            # Event handlers
+            def update_visibility(mode: str) -> Dict[str, Any]:
+                """Update component visibility based on input mode."""
+                return {
+                    input_text: gr.update(visible=(mode == InputMode.TEXT.value)),
+                    audio_input: gr.update(visible=(mode == InputMode.AUDIO.value)),
+                    file_input: gr.update(visible=(mode == InputMode.FILE.value)),
+                    extracted_text: gr.update(value="", visible=True),
+                    output_text: gr.update(value="")
+                }
+            def handle_process(
+                mode: str,
+                source_lang: str,
+                text_input: str,
+                audio_file: Optional[str],
+                file_obj: Optional[gr.FileData]
+            ) -> Tuple[str, str]:
+                """Handle initial input processing."""
+                try:
+                    processed_text = self.process_input(
+                        InputMode(mode),
+                        Language(source_lang),
+                        text_input,
+                        audio_file,
+                        file_obj
+                    )
+                    return processed_text, ""
+                except Exception as e:
+                    logger.error(f"Processing error: {e}")
+                    return "", f"❌ Error: {str(e)}"
+            def handle_translate(
+                extracted_text: str,
+                source_lang: str,
+                target_lang: str
+            ) -> str:
+                """Handle translation of processed text."""
+                if not extracted_text.strip():
+                    return "📝 No text to translate."
+                try:
+                    return self.translation_service.translate(
+                        extracted_text,
+                        Language(source_lang),
+                        Language(target_lang)
+                    )
+                except Exception as e:
+                    logger.error(f"Translation error: {e}")
+                    return f"❌ Translation error: {str(e)}"
+            # Connect events
+            input_mode.change(
+                fn=update_visibility,
+                inputs=input_mode,
+                outputs=[input_text, audio_input, file_input, extracted_text, output_text]
+            )
+            translate_btn.click(
+                fn=handle_process,
+                inputs=[input_mode, input_lang, input_text, audio_input, file_input],
+                outputs=[extracted_text, output_text]
+            ).then(
+                fn=handle_translate,
+                inputs=[extracted_text, input_lang, output_lang],
+                outputs=output_text
+            )
+        return interface
+# ================================
+# Application Entry Point
+# ================================
+def main():
+    """Main application entry point."""
     try:
+        app = TranslationApp()
+        interface = app.create_interface()
+        interface.launch(
+            server_name="0.0.0.0",
+            server_port=int(os.getenv("PORT", 7860)),
+            share=False
+        )
     except Exception as e:
+        logger.critical(f"Failed to start application: {e}")
+        raise
 if __name__ == "__main__":
+    main()