Spaces:

alibabasglab
/

ClearVoice

Running on Zero

App Files Files Community

alibabasglab committed on Oct 17, 2024

Commit

b78b7d0

verified ·

1 Parent(s): 3192961

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -4

app.py CHANGED Viewed

@@ -3,9 +3,10 @@ import soundfile as sf
 import gradio as gr
 from clearvoice import ClearVoice
-myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
-def fn_clearvoice(input_wav):
     output_wav_dict = myClearVoice(input_path=input_wav, online_write=False)
     if isinstance(output_wav_dict, dict):
         key = next(iter(output_wav_dict))
@@ -15,17 +16,46 @@ def fn_clearvoice(input_wav):
     sf.write('enhanced.wav', output_wav, 16000)
     return 'enhanced.wav'
 demo = gr.Blocks()
 se_demo = gr.Interface(
     fn=fn_clearvoice,
     inputs = [
         gr.Audio(label="Input Audio", type="filepath")
     ],
     outputs = [
         gr.Audio(label="Output Audio", type="filepath")
     ],
-    title = "ClearVoice",
     description = ("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
     article = ("<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/speechbrain/speechbrain' target='_blank'>Github Repo</a></p>"),
     examples = [
@@ -33,6 +63,7 @@ se_demo = gr.Interface(
     ],
     cache_examples = True,
 )
 with demo:
-    gr.TabbedInterface([se_demo, se_demo], ["Speech Enhancement", "Speech Separation"])
 demo.launch()

 import gradio as gr
 from clearvoice import ClearVoice
+#myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
+def fn_clearvoice_se(input_wav):
+    myClearVoice = ClearVoice(task='speech_enhancement', model_names=['FRCRN_SE_16K'])
     output_wav_dict = myClearVoice(input_path=input_wav, online_write=False)
     if isinstance(output_wav_dict, dict):
         key = next(iter(output_wav_dict))
     sf.write('enhanced.wav', output_wav, 16000)
     return 'enhanced.wav'
+def fn_clearvoice_ss(input_wav):
+    myClearVoice = ClearVoice(task='speech_separation', model_names=['MossFormer2_SS_16K'])
+    output_wav_dict = myClearVoice(input_path=input_wav, online_write=False)
+    if isinstance(output_wav_dict, dict):
+        key = next(iter(output_wav_dict))
+        output_wav = output_wav_dict[key]
+    else:
+        output_wav = output_wav_dict
+    sf.write('separated_1.wav', output_wav, 16000)
+    return 'separated_1.wav'
 demo = gr.Blocks()
 se_demo = gr.Interface(
+    fn=fn_clearvoice_se,
+    inputs = [
+        gr.Audio(label="Input Audio", type="filepath")
+    ],
+    outputs = [
+        gr.Audio(label="Output Audio", type="filepath")
+    ],
+    title = "ClearVoice: Speech Enhancement",
+    description = ("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
+    article = ("<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/speechbrain/speechbrain' target='_blank'>Github Repo</a></p>"),
+    examples = [
+        ['mandarin_speech.wav']
+    ],
+    cache_examples = True,
+)
+ss_demo = gr.Interface(
     fn=fn_clearvoice,
     inputs = [
         gr.Audio(label="Input Audio", type="filepath")
     ],
     outputs = [
         gr.Audio(label="Output Audio", type="filepath")
+        gr.Audio(label="Output Audio", type="filepath")
     ],
+    title = "ClearVoice: Speech Separation",
     description = ("Gradio demo for Speech enhancement with ClearVoice. To use it, simply upload your audio, or click one of the examples to load them. Read more at the links below."),
     article = ("<p style='text-align: center'><a href='https://arxiv.org/abs/2206.07293' target='_blank'>FRCRN: Boosting Feature Representation Using Frequency Recurrence for Monaural Speech Enhancement</a> | <a href='https://github.com/speechbrain/speechbrain' target='_blank'>Github Repo</a></p>"),
     examples = [
     ],
     cache_examples = True,
 )
 with demo:
+    gr.TabbedInterface([se_demo, ss_demo], ["Speech Enhancement", "Speech Separation"])
 demo.launch()