Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -9,8 +9,8 @@ import numpy as np
|
|
| 9 |
|
| 10 |
import ChatTTS
|
| 11 |
|
| 12 |
-
import se_extractor
|
| 13 |
-
from api import ToneColorConverter
|
| 14 |
import soundfile
|
| 15 |
|
| 16 |
print("loading ChatTTS model...")
|
|
@@ -80,7 +80,7 @@ tone_color_converter.load_ckpt(f'{ckpt_converter_en}/checkpoint.pth')
|
|
| 80 |
def generate_audio(text, audio_ref, temperature, top_P, top_K, audio_seed_input, text_seed_input, refine_text_flag, refine_text_input):
|
| 81 |
save_path = "output.wav"
|
| 82 |
|
| 83 |
-
if audio_ref
|
| 84 |
# Run the base speaker tts
|
| 85 |
src_path = "tmp.wav"
|
| 86 |
text_data = chat_tts(text, temperature, top_P, top_K, audio_seed_input, text_seed_input, refine_text_flag, refine_text_input, src_path)
|
|
@@ -108,17 +108,19 @@ def generate_audio(text, audio_ref, temperature, top_P, top_K, audio_seed_input,
|
|
| 108 |
|
| 109 |
|
| 110 |
with gr.Blocks() as demo:
|
| 111 |
-
gr.Markdown("#
|
|
|
|
|
|
|
| 112 |
|
| 113 |
default_text = "Today a man knocked on my door and asked for a small donation toward the local swimming pool. I gave him a glass of water."
|
| 114 |
text_input = gr.Textbox(label="Input Text", lines=4, placeholder="Please Input Text...", value=default_text)
|
| 115 |
|
| 116 |
|
| 117 |
default_refine_text = "[oral_2][laugh_0][break_6]"
|
| 118 |
-
refine_text_checkbox = gr.Checkbox(label="Refine text
|
| 119 |
refine_text_input = gr.Textbox(label="Refine Prompt", lines=1, placeholder="Please Refine Prompt...", value=default_refine_text)
|
| 120 |
with gr.Column():
|
| 121 |
-
voice_ref = gr.Audio(label="
|
| 122 |
|
| 123 |
with gr.Row():
|
| 124 |
temperature_slider = gr.Slider(minimum=0.00001, maximum=1.0, step=0.00001, value=0.3, label="Audio temperature")
|
|
@@ -148,15 +150,12 @@ with gr.Blocks() as demo:
|
|
| 148 |
inputs=[text_input, voice_ref, temperature_slider, top_p_slider, top_k_slider, audio_seed_input, text_seed_input, refine_text_checkbox, refine_text_input],
|
| 149 |
outputs=[audio_output,text_output])
|
| 150 |
|
| 151 |
-
parser = argparse.ArgumentParser(description='ChatTTS
|
| 152 |
parser.add_argument('--server_name', type=str, default='0.0.0.0', help='Server name')
|
| 153 |
parser.add_argument('--server_port', type=int, default=8080, help='Server port')
|
| 154 |
args = parser.parse_args()
|
| 155 |
|
| 156 |
-
|
| 157 |
-
|
| 158 |
-
|
| 159 |
-
|
| 160 |
|
| 161 |
if __name__ == '__main__':
|
| 162 |
demo.launch()
|
|
|
|
| 9 |
|
| 10 |
import ChatTTS
|
| 11 |
|
| 12 |
+
import OpenVoice.se_extractor as se_extractor
|
| 13 |
+
from OpenVoice.api import ToneColorConverter
|
| 14 |
import soundfile
|
| 15 |
|
| 16 |
print("loading ChatTTS model...")
|
|
|
|
| 80 |
def generate_audio(text, audio_ref, temperature, top_P, top_K, audio_seed_input, text_seed_input, refine_text_flag, refine_text_input):
|
| 81 |
save_path = "output.wav"
|
| 82 |
|
| 83 |
+
if audio_ref != "" :
|
| 84 |
# Run the base speaker tts
|
| 85 |
src_path = "tmp.wav"
|
| 86 |
text_data = chat_tts(text, temperature, top_P, top_K, audio_seed_input, text_seed_input, refine_text_flag, refine_text_input, src_path)
|
|
|
|
| 108 |
|
| 109 |
|
| 110 |
with gr.Blocks() as demo:
|
| 111 |
+
gr.Markdown("# <center>🥳 ChatTTS x OpenVoice 🥳</center>")
|
| 112 |
+
gr.Markdown("## <center>🌟 Make it sound super natural and switch it up to any voice you want, nailing the mood and tone also!🌟 </center>")
|
| 113 |
+
gr.Markdown("### <center>💕 Slide on over to [linkin.love](https://linkin.love) for a chat-fest with your AI buds!💕</center>")
|
| 114 |
|
| 115 |
default_text = "Today a man knocked on my door and asked for a small donation toward the local swimming pool. I gave him a glass of water."
|
| 116 |
text_input = gr.Textbox(label="Input Text", lines=4, placeholder="Please Input Text...", value=default_text)
|
| 117 |
|
| 118 |
|
| 119 |
default_refine_text = "[oral_2][laugh_0][break_6]"
|
| 120 |
+
refine_text_checkbox = gr.Checkbox(label="Refine text", info="'oral' means add filler words, 'laugh' means add laughter, and 'break' means add a pause. (0-10) ", value=True)
|
| 121 |
refine_text_input = gr.Textbox(label="Refine Prompt", lines=1, placeholder="Please Refine Prompt...", value=default_refine_text)
|
| 122 |
with gr.Column():
|
| 123 |
+
voice_ref = gr.Audio(label="Reference Audio", info="Click on the ✎ button to upload your own target speaker audio", type="filepath", value="examples/speaker.mp3")
|
| 124 |
|
| 125 |
with gr.Row():
|
| 126 |
temperature_slider = gr.Slider(minimum=0.00001, maximum=1.0, step=0.00001, value=0.3, label="Audio temperature")
|
|
|
|
| 150 |
inputs=[text_input, voice_ref, temperature_slider, top_p_slider, top_k_slider, audio_seed_input, text_seed_input, refine_text_checkbox, refine_text_input],
|
| 151 |
outputs=[audio_output,text_output])
|
| 152 |
|
| 153 |
+
parser = argparse.ArgumentParser(description='ChatTTS-OpenVoice Launch')
|
| 154 |
parser.add_argument('--server_name', type=str, default='0.0.0.0', help='Server name')
|
| 155 |
parser.add_argument('--server_port', type=int, default=8080, help='Server port')
|
| 156 |
args = parser.parse_args()
|
| 157 |
|
| 158 |
+
# demo.launch(server_name=args.server_name, server_port=args.server_port, inbrowser=True)
|
|
|
|
|
|
|
|
|
|
| 159 |
|
| 160 |
if __name__ == '__main__':
|
| 161 |
demo.launch()
|