Spaces:

alibabasglab
/

ClearVoice

Runtime error

App Files Files Community

alibabasglab committed on Oct 17, 2024

Commit

4554491

verified ·

1 Parent(s): 8bb6908

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -8

app.py CHANGED Viewed

@@ -3,8 +3,6 @@ import soundfile as sf
 import gradio as gr
 from clearvoice import ClearVoice
-#myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
 def fn_clearvoice_se(input_wav):
     myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
     output_wav_dict = myClearVoice(input_path=input_wav, online_write=False)
@@ -21,11 +19,16 @@ def fn_clearvoice_ss(input_wav):
     output_wav_dict = myClearVoice(input_path=input_wav, online_write=False)
     if isinstance(output_wav_dict, dict):
         key = next(iter(output_wav_dict))
-        output_wav = output_wav_dict[key]
     else:
-        output_wav = output_wav_dict
-    sf.write('separated_1.wav', output_wav, 16000)
-    return 'separated_1.wav'
 demo = gr.Blocks()
@@ -39,7 +42,8 @@ se_demo = gr.Interface(
     ],
     title = "ClearVoice: Speech Enhancement",
     description = ("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
-    article = ("<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/speechbrain/speechbrain' target='_blank'>Github Repo</a></p>"),
     examples = [
         ['mandarin_speech.wav']
     ],
@@ -57,7 +61,8 @@ ss_demo = gr.Interface(
     ],
     title = "ClearVoice: Speech Separation",
     description = ("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
-    article = ("<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/speechbrain/speechbrain' target='_blank'>Github Repo</a></p>"),
     examples = [
         ['mandarin_speech.wav']
     ],

 import gradio as gr
 from clearvoice import ClearVoice
 def fn_clearvoice_se(input_wav):
     myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
     output_wav_dict = myClearVoice(input_path=input_wav, online_write=False)
     output_wav_dict = myClearVoice(input_path=input_wav, online_write=False)
     if isinstance(output_wav_dict, dict):
         key = next(iter(output_wav_dict))
+        output_wav_list = output_wav_dict[key]
+        output_wav_s1 = output_wav_list[0]
+        output_wav_s2 = output_wav_list[1]
     else:
+        output_wav_list = output_wav_dict
+        output_wav_s1 = output_wav_list[0]
+        output_wav_s2 = output_wav_list[1]
+    sf.write('separated_s1.wav', output_wav_s1, 16000)
+    sf.write('separated_s2.wav', output_wav_s2, 16000)
+    return "separated_s1.wav", "separated_s2.wav"
 demo = gr.Blocks()
     ],
     title = "ClearVoice: Speech Enhancement",
     description = ("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
+    article = ("<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/alibabasglab' target='_blank'>Github Repo</a></p>"
+              ),
     examples = [
         ['mandarin_speech.wav']
     ],
     ],
     title = "ClearVoice: Speech Separation",
     description = ("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
+    article = ("<p style='text-align: center'><a href='https://arxiv.org/abs/2302.11824' target='_blank'>MossFormer: Pushing the Performance Limit of Monaural Speech Separation using Gated Single-Head Transformer with Convolution-Augmented Joint Self-Attentions</a> | <a href='https://github.com/alibabasglab' target='_blank'>Github Repo</a></p>"
+              "<p style='text-align: center'><a href='https://arxiv.org/abs/2312.11825' target='_blank'>MossFormer2: Combining Transformer and RNN-Free Recurrent Network for Enhanced Time-Domain Monaural Speech Separation</a> | <a href='https://github.com/alibabasglab' target='_blank'>Github Repo</a></p>"),
     examples = [
         ['mandarin_speech.wav']
     ],