audio-separator

Running

App Files Community

Politrees committed on Nov 10, 2024

Commit

e42de32

verified ·

1 Parent(s): b43d613

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -8

app.py CHANGED Viewed

@@ -20,9 +20,10 @@ ROFORMER_MODELS = {
     'Mel-Roformer-Karaoke-Aufr33-Viperx.ckpt': 'mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt',
     'Mel-Roformer-Denoise-Aufr33': 'denoise_mel_band_roformer_aufr33_sdr_27.9959.ckpt',
     'Mel-Roformer-Denoise-Aufr33-Aggr': 'denoise_mel_band_roformer_aufr33_aggr_sdr_27.9768.ckpt',
-    'MB-Roformer-Inst-v1 by Kim': 'melband_roformer_inst_v1.ckpt',
-    'MB-Roformer-InstVoc-Duality-v1 by Unwa': 'melband_roformer_instvoc_duality_v1.ckpt',
-    'MB-Roformer-InstVoc-Duality-v2 by Unwa': 'melband_roformer_instvox_duality_v2.ckpt',
 }
 MDX23C_MODELS = [
     'MDX23C_D1581.ckpt',
@@ -109,7 +110,7 @@ def print_message(input_file, model_name):
     """Prints information about the audio separation process."""
     base_name = os.path.splitext(os.path.basename(input_file))[0]
     print("\n")
-    print("🎵 PolUVR 🎵")
     print("Input audio:", base_name)
     print("Separation Model:", model_name)
     print("Audio Separation Process...")
@@ -323,15 +324,15 @@ with gr.Blocks(
     gr.HTML("<h1> 🎵 Audio-Separator 🎵 </h1>")
     with gr.Accordion("General settings", open=False):
         with gr.Group():
-            model_file_dir = gr.Textbox(value="/tmp/audio-separator-models/", label="Directory to cache model files", info="The directory where model files are stored.", placeholder="/tmp/audio-separator-models/", interactive=False)
             with gr.Row():
-                output_dir = gr.Textbox(value="output", label="File output directory", info="The directory where output files will be saved.", placeholder="output", interactive=False)
                 output_format = gr.Dropdown(value="wav", choices=["wav", "flac", "mp3"], label="Output Format", info="The format of the output audio file.")
             with gr.Row():
                 norm_threshold = gr.Slider(minimum=0.1, maximum=1, step=0.1, value=0.9, label="Normalization threshold", info="The threshold for audio normalization.")
                 amp_threshold = gr.Slider(minimum=0.1, maximum=1, step=0.1, value=0.6, label="Amplification threshold", info="The threshold for audio amplification.")
             with gr.Row():
-                batch_size = gr.Slider(minimum=1, maximum=16, step=1, value=1, label="Batch Size", info="Larger consumes more RAM but may process slightly faster.", interactive=False)
     with gr.Tab("Roformer"):
         with gr.Group():
@@ -520,4 +521,8 @@ with gr.Blocks(
         outputs=[demucs_stem1, demucs_stem2, demucs_stem3, demucs_stem4, demucs_stem5, demucs_stem6],
     )
-app.launch(share=True)

     'Mel-Roformer-Karaoke-Aufr33-Viperx.ckpt': 'mel_band_roformer_karaoke_aufr33_viperx_sdr_10.1956.ckpt',
     'Mel-Roformer-Denoise-Aufr33': 'denoise_mel_band_roformer_aufr33_sdr_27.9959.ckpt',
     'Mel-Roformer-Denoise-Aufr33-Aggr': 'denoise_mel_band_roformer_aufr33_aggr_sdr_27.9768.ckpt',
+    'MelBand Roformer Kim | Inst V1 by Unwa': 'melband_roformer_inst_v1.ckpt',
+    'MelBand Roformer Kim | Inst V2 by Unwa': 'melband_roformer_inst_v2.ckpt',
+    'MelBand Roformer Kim | InstVoc Duality V1 by Unwa': 'melband_roformer_instvoc_duality_v1.ckpt',
+    'MelBand Roformer Kim | InstVoc Duality V2 by Unwa': 'melband_roformer_instvox_duality_v2.ckpt',
 }
 MDX23C_MODELS = [
     'MDX23C_D1581.ckpt',
     """Prints information about the audio separation process."""
     base_name = os.path.splitext(os.path.basename(input_file))[0]
     print("\n")
+    print("🎵 Audio-Separator 🎵")
     print("Input audio:", base_name)
     print("Separation Model:", model_name)
     print("Audio Separation Process...")
     gr.HTML("<h1> 🎵 Audio-Separator 🎵 </h1>")
     with gr.Accordion("General settings", open=False):
         with gr.Group():
+            model_file_dir = gr.Textbox(value="/tmp/audio-separator-models/", label="Directory to cache model files", info="The directory where model files are stored.", placeholder="/tmp/audio-separator-models/")
             with gr.Row():
+                output_dir = gr.Textbox(value="output", label="File output directory", info="The directory where output files will be saved.", placeholder="output")
                 output_format = gr.Dropdown(value="wav", choices=["wav", "flac", "mp3"], label="Output Format", info="The format of the output audio file.")
             with gr.Row():
                 norm_threshold = gr.Slider(minimum=0.1, maximum=1, step=0.1, value=0.9, label="Normalization threshold", info="The threshold for audio normalization.")
                 amp_threshold = gr.Slider(minimum=0.1, maximum=1, step=0.1, value=0.6, label="Amplification threshold", info="The threshold for audio amplification.")
             with gr.Row():
+                batch_size = gr.Slider(minimum=1, maximum=16, step=1, value=1, label="Batch Size", info="Larger consumes more RAM but may process slightly faster.")
     with gr.Tab("Roformer"):
         with gr.Group():
         outputs=[demucs_stem1, demucs_stem2, demucs_stem3, demucs_stem4, demucs_stem5, demucs_stem6],
     )
+def main():
+    app.launch(share=True)
+if __name__ == "__main__":
+    main()