Spaces:

amaai-lab
/

SonicMaster

Running on Zero

App Files Files Community

ambujm22 committed on Aug 22

Commit

c6d1d61

verified ·

1 Parent(s): 5bce909

Update app.py

Browse files

Files changed (1) hide show

app.py +97 -21

app.py CHANGED Viewed

@@ -2,7 +2,7 @@
 import os
 os.environ.setdefault("GRADIO_USE_CDN", "true")
-# Optional: 'spaces' is present on Spaces; harmless to try locally.
 try:
     import spaces
 except Exception:
@@ -25,14 +25,14 @@ def gpu_echo(x: str = "ok"):
 import sys
 import subprocess
 from pathlib import Path
-from typing import Tuple, Optional, List
 import gradio as gr
 import numpy as np
 import soundfile as sf
 from huggingface_hub import hf_hub_download
-# ZeroGPU runtime hint (still safe on CPU)
 USE_ZEROGPU = os.getenv("SPACE_RUNTIME", "").lower() == "zerogpu"
 SPACE_ROOT   = Path(__file__).parent.resolve()
@@ -140,7 +140,7 @@ def run_sonicmaster_cli(
     return False, last_err or "All candidate commands failed."
 # ========== GPU path (called only if ZeroGPU/GPU available) ==========
-@spaces.GPU(duration=180)
 def enhance_on_gpu(input_path: str, prompt: str, output_path: str) -> Tuple[bool, str]:
     try:
         import torch  # noqa: F401
@@ -156,6 +156,56 @@ def _has_cuda() -> bool:
     except Exception:
         return False
 # ========== Gradio callback ==========
 def enhance_audio_ui(
     audio_path: str,
@@ -202,33 +252,59 @@ def enhance_audio_ui(
         return None, f"Unexpected error: {e}\n{traceback.format_exc()}"
 # ========== Gradio UI ==========
-PROMPT_EXAMPLES = [
-    ["Increase the clarity of this song by emphasizing treble frequencies."],
-    ["Make this song sound more boomy by amplifying the low end bass frequencies."],
-    ["Make the audio smoother and less distorted."],
-    ["Improve the balance in this song."],
-    ["Reduce roominess/echo (dereverb)."],
-    ["Raise the level of the vocals."],
-    ["Give the song a wider stereo image."],
-]
 with gr.Blocks(title="SonicMaster – Text-Guided Restoration & Mastering", fill_height=True) as _demo:
     gr.Markdown(
         "## 🎧 SonicMaster\n"
-        "Upload or choose an example prompt, write your own instruction, then click **Enhance**.\n"
-        "- First run downloads model weights & repo (progress will show).\n"
-        "- On failure, the **Status** box shows the exact error (we won't echo the input audio)."
     )
     with gr.Row():
-        with gr.Column():
             in_audio = gr.Audio(label="Input Audio", type="filepath")
             prompt   = gr.Textbox(label="Text Prompt", placeholder="e.g., Reduce reverb and brighten vocals.")
             run_btn  = gr.Button("🚀 Enhance", variant="primary")
-            gr.Examples(examples=PROMPT_EXAMPLES, inputs=[prompt], label="Prompt Examples")
-        with gr.Column():
             out_audio = gr.Audio(label="Enhanced Audio (output)")
             status    = gr.Textbox(label="Status / Messages", interactive=False, lines=8)
     run_btn.click(
         fn=enhance_audio_ui,
         inputs=[in_audio, prompt],
@@ -243,4 +319,4 @@ app = demo
 # Local debugging only
 if __name__ == "__main__":
-    demo.launch(server_name="0.0.0.0", server_port=7860)

 import os
 os.environ.setdefault("GRADIO_USE_CDN", "true")
+# Optional: 'spaces' present on Spaces; harmless to try locally.
 try:
     import spaces
 except Exception:
 import sys
 import subprocess
 from pathlib import Path
+from typing import Tuple, Optional, List, Dict, Any
 import gradio as gr
 import numpy as np
 import soundfile as sf
 from huggingface_hub import hf_hub_download
+# ZeroGPU runtime hint (safe on CPU)
 USE_ZEROGPU = os.getenv("SPACE_RUNTIME", "").lower() == "zerogpu"
 SPACE_ROOT   = Path(__file__).parent.resolve()
     return False, last_err or "All candidate commands failed."
 # ========== GPU path (called only if ZeroGPU/GPU available) ==========
+@spaces.GPU(duration=60)
 def enhance_on_gpu(input_path: str, prompt: str, output_path: str) -> Tuple[bool, str]:
     try:
         import torch  # noqa: F401
     except Exception:
         return False
+# ========== Examples (lazy) ==========
+# Suggested prompts, looked up by position in set_example_selection: the
+# prompt at index i is offered for the i-th sample path.
+# NOTE(review): the first and ninth entries are identical — confirm this is
+# intentional rather than a copy-paste slip.
+PROMPTS_10 = [
+    "Increase the clarity of this song by emphasizing treble frequencies.",
+    "Make this song sound more boomy by amplifying the low end bass frequencies.",
+    "Can you make this sound louder, please?",
+    "Make the audio smoother and less distorted.",
+    "Improve the balance in this song.",
+    "Disentangle the left and right channels to give this song a stereo feeling.",
+    "Correct the unnatural frequency emphasis. Reduce the roominess or echo.",
+    "Raise the level of the vocals, please.",
+    "Increase the clarity of this song by emphasizing treble frequencies.",
+    "Please, dereverb this audio.",
+]
+def list_example_files(progress: Optional[gr.Progress] = None) -> List[str]:
+    """Collect up to ten sample ``.wav`` files from ``samples/inputs``.
+
+    The directory is resolved relative to whatever ``ensure_repo`` returns;
+    ``progress`` is forwarded to that call unchanged.
+
+    Returns:
+        POSIX-style path strings for regular files matching ``*.wav``,
+        in sorted order, truncated to the first 10.
+    """
+    inputs_dir = ensure_repo(progress=progress) / "samples" / "inputs"
+    wav_files = [candidate for candidate in inputs_dir.glob("*.wav") if candidate.is_file()]
+    wav_files.sort()
+    return [wav.as_posix() for wav in wav_files[:10]]
+def load_examples(_: Any = None, progress=gr.Progress()) -> Dict[str, Any]:
+    """Gather the sample audio files and describe them for the UI.
+
+    Args:
+        _: Ignored; accepted so the function can also be called with one
+            positional argument.
+        progress: Progress tracker forwarded to ``list_example_files``.
+
+    Returns:
+        A plain dict keyed by strings (not by Gradio components):
+        ``"choices"`` holds dropdown labels such as ``"01 — name.wav"``,
+        ``"paths"`` holds the sample paths in the same order as the labels,
+        and ``"status"`` holds a human-readable summary. All three keys are
+        always present; ``"choices"`` and ``"paths"`` are empty lists when
+        no samples were found.
+    """
+    paths = list_example_files(progress=progress)
+    if not paths:
+        # Same keys as the success case, so callers can index the result
+        # without special-casing the empty outcome.
+        return {
+            "choices": [],
+            "paths": [],
+            "status": "No sample .wav files found in repo/samples/inputs.",
+        }
+    # Labels are 1-based and zero-padded; set_example_selection parses the
+    # leading number back into an index.
+    labels = [f"{n:02d} — {Path(p).name}" for n, p in enumerate(paths, start=1)]
+    return {
+        "choices": labels,
+        "paths": paths,
+        "status": f"Loaded {len(paths)} sample audios.",
+    }
+def set_example_selection(idx_label: str, paths: List[str]) -> Tuple[str, str]:
+    """Translate a picked dropdown label into ``(audio_path, prompt)``.
+
+    Args:
+        idx_label: Label whose first whitespace-separated token is a
+            1-based number, e.g. ``"01 — file.wav"``.
+        paths: Sample paths; the label's number selects one of them.
+
+    Returns:
+        The selected path and the prompt from ``PROMPTS_10`` at the same
+        position (the last prompt if there are more paths than prompts).
+        Returns ``("", "")`` when either argument is empty.
+    """
+    nothing_to_select = not (idx_label and paths)
+    if nothing_to_select:
+        return "", ""
+    try:
+        number = int(idx_label.split()[0])
+    except Exception:
+        # Unparseable label: fall back to the first sample.
+        position = 0
+    else:
+        # Labels are 1-based ("01 — file.wav" -> index 0).
+        position = number - 1
+    # Clamp into the valid index range of paths.
+    position = min(max(position, 0), len(paths) - 1)
+    suggested = PROMPTS_10[min(position, len(PROMPTS_10) - 1)]
+    return paths[position], suggested
 # ========== Gradio callback ==========
 def enhance_audio_ui(
     audio_path: str,
         return None, f"Unexpected error: {e}\n{traceback.format_exc()}"
 # ========== Gradio UI ==========
 with gr.Blocks(title="SonicMaster – Text-Guided Restoration & Mastering", fill_height=True) as _demo:
     gr.Markdown(
         "## 🎧 SonicMaster\n"
+        "Upload audio or **load sample audios**, write a prompt, then click **Enhance**.\n"
+        "- On failure, the **Status** box shows the exact error "
     )
     with gr.Row():
+        with gr.Column(scale=1):
+            # Sample loader (lazy)
+            with gr.Accordion("Sample audios (10)", open=False):
+                load_btn = gr.Button("📥 Load 10 sample audios")
+                samples_dropdown = gr.Dropdown(choices=[], label="Pick a sample", interactive=True)
+                samples_state = gr.State([])  # holds absolute paths
             in_audio = gr.Audio(label="Input Audio", type="filepath")
             prompt   = gr.Textbox(label="Text Prompt", placeholder="e.g., Reduce reverb and brighten vocals.")
             run_btn  = gr.Button("🚀 Enhance", variant="primary")
+            # Optional quick prompt examples (text-only)
+            gr.Examples(
+                examples=[[p] for p in [
+                    "Reduce roominess/echo (dereverb).",
+                    "Raise the level of the vocals.",
+                    "Give the song a wider stereo image.",
+                ]],
+                inputs=[prompt],
+                label="Prompt Examples",
+            )
+        with gr.Column(scale=1):
             out_audio = gr.Audio(label="Enhanced Audio (output)")
             status    = gr.Textbox(label="Status / Messages", interactive=False, lines=8)
+    # --- Wire up the sample loader ---
+    # 1) Load samples on button click (lazy clone)
+    # A handler's return value reaches components only through `outputs`;
+    # callbacks chained with `.then()` receive their own `inputs`, not the
+    # previous handler's result. So adapt the dict from load_examples into
+    # one positional value per output component.
+    def _load_examples_into_ui(progress=gr.Progress()):
+        """Run load_examples and return (dropdown update, paths, status)."""
+        result = load_examples(progress=progress)
+        return (
+            # gr.update(choices=...) replaces the dropdown's options; a bare
+            # list would be treated as the dropdown's value instead.
+            gr.update(choices=result.get("choices", [])),
+            result.get("paths", []),
+            result.get("status", ""),
+        )
+    load_result = load_btn.click(
+        fn=_load_examples_into_ui,
+        inputs=None,
+        outputs=[samples_dropdown, samples_state, status],
+    )
+    # 2) When a sample is chosen, set audio path + suggested prompt
+    samples_dropdown.change(
+        fn=set_example_selection,
+        inputs=[samples_dropdown, samples_state],
+        outputs=[in_audio, prompt],
+    )
+    # --- Enhance button ---
     run_btn.click(
         fn=enhance_audio_ui,
         inputs=[in_audio, prompt],
 # Local debugging only
 if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860)