Spaces:

stepfun-ai
/

Step-Audio-EditX

Running on Zero

xieli committed 30 days ago

Commit

066d2f4

1 Parent(s): 5bdad28

feat: fix asr

Files changed (1) hide show

app.py CHANGED Viewed

@@ -170,6 +170,27 @@ def process_audio_with_gpu(audio_input, text_input, target_text, task_type, task
         logger.error(f"❌ Audio processing failed: {e}")
         raise
     # GPU automatically deallocated when function exits
 # Save audio to temporary directory
 def save_audio(audio_type, audio_data, sr, tmp_dir):
@@ -450,27 +471,6 @@ class EditxTab:
         value = None if len(choices) == 0 else choices[0]
         return gr.Dropdown(label="Sub-task", choices=choices, value=value)
-    @spaces.GPU(duration=30)
-    def transcribe_audio(self, audio_input, current_text):
-        """Transcribe audio using Whisper ASR when prompt text is empty"""
-        global whisper_asr
-        # Only transcribe if current text is empty
-        if current_text and current_text.strip():
-            return current_text  # Keep existing text
-        if not audio_input:
-            return ""  # No audio to transcribe
-        if whisper_asr is None:
-            initialize_whisper()
-        try:
-            # Transcribe audio
-            transcribed_text = whisper_asr(audio_input)
-            self.logger.info(f"Audio transcribed: {transcribed_text}")
-            return transcribed_text
-        except Exception as e:
-            self.logger.error(f"Failed to transcribe audio: {e}")
-            return ""
 def launch_demo(args, editx_tab):
     """Launch the gradio demo"""

         logger.error(f"❌ Audio processing failed: {e}")
         raise
     # GPU automatically deallocated when function exits
+@spaces.GPU(duration=30)
+def transcribe_audio(self, audio_input, current_text):
+    """Transcribe audio using Whisper ASR when prompt text is empty"""
+    global whisper_asr
+    # Only transcribe if current text is empty
+    if current_text and current_text.strip():
+        return current_text  # Keep existing text
+    if not audio_input:
+        return ""  # No audio to transcribe
+    if whisper_asr is None:
+        initialize_whisper()
+    try:
+        # Transcribe audio
+        transcribed_text = whisper_asr(audio_input)
+        self.logger.info(f"Audio transcribed: {transcribed_text}")
+        return transcribed_text
+    except Exception as e:
+        self.logger.error(f"Failed to transcribe audio: {e}")
+        return ""
 # Save audio to temporary directory
 def save_audio(audio_type, audio_data, sr, tmp_dir):
         value = None if len(choices) == 0 else choices[0]
         return gr.Dropdown(label="Sub-task", choices=choices, value=value)
 def launch_demo(args, editx_tab):
     """Launch the gradio demo"""