Spaces:

AlexK-PL
/

Tacotron2_GST_eng

Sleeping

AlexK-PL committed on Sep 5, 2023

Commit

eec8d3d

1 Parent(s): 3ed419f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,6 +10,7 @@ from melgan.utils.hparams import load_hparam
 import torch
 import numpy as np
 from matplotlib import pyplot as plt
 from matplotlib import gridspec
@@ -88,8 +89,19 @@ def synthesize(text, gst_1, gst_2, gst_3):
     return (22050, audio_numpy), fig_mel  # fig_align
-iface = gr.Interface(fn=synthesize, inputs=[gr.Textbox(label="Input Text"), gr.Slider(0.2, 0.45, label="First style token weight:"),
-                                            gr.Slider(0.2, 0.45, label="Second style token weight:"), gr.Slider(0.2, 0.45, label="Third style token weight:")],
                      outputs=[gr.Audio(label="Generated Speech", type="numpy"), gr.Plot(label="Output"),],
                      title="Single-Head Attention Tacotron2 with Style Tokens", description=DESCRIPTION)
 iface.launch()

 import torch
 import numpy as np
+import random
 from matplotlib import pyplot as plt
 from matplotlib import gridspec
     return (22050, audio_numpy), fig_mel  # fig_align
+def randomize_style_weights():
+    rand_weight_1 = random.randrange(0.3, 0.45, 0.01)
+    rand_weight_2 = random.randrange(0.3, 0.45, 0.01)
+    rand_weight_3 = 1.0 - (rand_weight_1 + rand_weight_2)
+    return rand_weight_1, rand_weight_2, rand_weight_3
+w1, w2, w3 = randomize_style_weights()  # drawn once, when this module-level statement runs
+iface = gr.Interface(fn=synthesize, inputs=[gr.Textbox(label="Input Text"), gr.Slider(0.2, 0.45, label="First style token weight:", value=w1),  # w1..w3 become the sliders' initial values
+                                            gr.Slider(0.2, 0.45, label="Second style token weight:", value=w2),
+                                            gr.Slider(0.2, 0.45, label="Third style token weight:",value=w3)],
                      outputs=[gr.Audio(label="Generated Speech", type="numpy"), gr.Plot(label="Output"),],  # matches synthesize's (audio, figure) return pair
                      title="Single-Head Attention Tacotron2 with Style Tokens", description=DESCRIPTION)
 iface.launch()