Spaces:
Runtime error
Runtime error
added extra params
Browse files
app.py
CHANGED
|
@@ -19,7 +19,7 @@ def load_model():
|
|
| 19 |
|
| 20 |
# Function to set up, generate, and process the audio
|
| 21 |
@spaces.GPU(duration=120) # Allocate GPU only when this function is called
|
| 22 |
-
def generate_audio(prompt, seconds_total=30, steps=100, cfg_scale=7):
|
| 23 |
print(f"Prompt received: {prompt}")
|
| 24 |
print(f"Settings: Duration={seconds_total}s, Steps={steps}, CFG Scale={cfg_scale}")
|
| 25 |
|
|
@@ -56,9 +56,9 @@ def generate_audio(prompt, seconds_total=30, steps=100, cfg_scale=7):
|
|
| 56 |
cfg_scale=cfg_scale,
|
| 57 |
conditioning=conditioning,
|
| 58 |
sample_size=sample_size,
|
| 59 |
-
sigma_min=0.3,
|
| 60 |
-
sigma_max=500,
|
| 61 |
-
sampler_type="dpmpp-3m-sde",
|
| 62 |
device=device
|
| 63 |
)
|
| 64 |
print("Audio generated.")
|
|
@@ -85,11 +85,16 @@ def generate_audio(prompt, seconds_total=30, steps=100, cfg_scale=7):
|
|
| 85 |
# Setting up the Gradio Interface
|
| 86 |
interface = gr.Interface(
|
| 87 |
fn=generate_audio,
|
|
|
|
| 88 |
inputs=[
|
| 89 |
gr.Textbox(label="Prompt", placeholder="Enter your text prompt here"),
|
|
|
|
| 90 |
gr.Slider(0, 47, value=30, label="Duration in Seconds"),
|
| 91 |
gr.Slider(10, 150, value=100, step=10, label="Number of Diffusion Steps"),
|
| 92 |
-
gr.Slider(1, 15, value=7, step=0.1, label="CFG Scale")
|
|
|
|
|
|
|
|
|
|
| 93 |
],
|
| 94 |
outputs=gr.Audio(type="filepath", label="Generated Audio"),
|
| 95 |
title="Stable Audio Generator",
|
|
|
|
| 19 |
|
| 20 |
# Function to set up, generate, and process the audio
|
| 21 |
@spaces.GPU(duration=120) # Allocate GPU only when this function is called
|
| 22 |
+
def generate_audio(prompt, sampler_type_dropdown, seconds_total=30, steps=100, cfg_scale=7,sigma_min_slider=0.3,sigma_max_slider=500):
|
| 23 |
print(f"Prompt received: {prompt}")
|
| 24 |
print(f"Settings: Duration={seconds_total}s, Steps={steps}, CFG Scale={cfg_scale}")
|
| 25 |
|
|
|
|
| 56 |
cfg_scale=cfg_scale,
|
| 57 |
conditioning=conditioning,
|
| 58 |
sample_size=sample_size,
|
| 59 |
+
sigma_min=sigma_min_slider,
|
| 60 |
+
sigma_max=sigma_max_slider,
|
| 61 |
+
sampler_type=sampler_type_dropdown,#"dpmpp-3m-sde",
|
| 62 |
device=device
|
| 63 |
)
|
| 64 |
print("Audio generated.")
|
|
|
|
| 85 |
# Setting up the Gradio Interface
|
| 86 |
interface = gr.Interface(
|
| 87 |
fn=generate_audio,
|
| 88 |
+
|
| 89 |
inputs=[
|
| 90 |
gr.Textbox(label="Prompt", placeholder="Enter your text prompt here"),
|
| 91 |
+
gr.Dropdown(["dpmpp-2m-sde", "dpmpp-3m-sde", "k-heun", "k-lms", "k-dpmpp-2s-ancestral", "k-dpm-2", "k-dpm-fast"], label="Sampler type", value="dpmpp-3m-sde"),
|
| 92 |
gr.Slider(0, 47, value=30, label="Duration in Seconds"),
|
| 93 |
gr.Slider(10, 150, value=100, step=10, label="Number of Diffusion Steps"),
|
| 94 |
+
gr.Slider(1, 15, value=7, step=0.1, label="CFG Scale"),
|
| 95 |
+
gr.Slider(minimum=0.0, maximum=5.0, step=0.01, value=0.3, label="Sigma min"),
|
| 96 |
+
gr.Slider(minimum=0.0, maximum=1000.0, step=0.1, value=500, label="Sigma max"),
|
| 97 |
+
|
| 98 |
],
|
| 99 |
outputs=gr.Audio(type="filepath", label="Generated Audio"),
|
| 100 |
title="Stable Audio Generator",
|