Spaces:

soiz
/

mikuTTSAPI

Running

App Files Community

NoCrypt committed on Aug 13, 2023

Commit

087c3c2

1 Parent(s): 3971395

added back limitation

Browse files

Files changed (1) hide show

app.py +20 -12

app.py CHANGED Viewed

@@ -39,10 +39,8 @@ tts_voice_list = asyncio.get_event_loop().run_until_complete(edge_tts.list_voice
 tts_voices = [f"{v['ShortName']}-{v['Gender']}" for v in tts_voice_list]
 # RVC models
-model_root = snapshot_download(
-    repo_id="NoCrypt/miku_RVC", token=os.environ["TOKEN"])
-models = [d for d in os.listdir(
-    model_root) if os.path.isdir(f"{model_root}/{d}")]
 models.sort()
@@ -61,14 +59,12 @@ def model_data(model_name):
     version = cpt.get("version", "v1")
     if version == "v1":
         if if_f0 == 1:
-            net_g = SynthesizerTrnMs256NSFsid(
-                *cpt["config"], is_half=config.is_half)
         else:
             net_g = SynthesizerTrnMs256NSFsid_nono(*cpt["config"])
     elif version == "v2":
         if if_f0 == 1:
-            net_g = SynthesizerTrnMs768NSFsid(
-                *cpt["config"], is_half=config.is_half)
         else:
             net_g = SynthesizerTrnMs768NSFsid_nono(*cpt["config"])
     else:
@@ -133,9 +129,15 @@ def tts(
     print(tts_text)
     print(f"tts_voice: {tts_voice}, speed: {speed}")
     print(f"Model name: {model_name}")
-    print(
-        f"F0: {f0_method}, Key: {f0_up_key}, Index: {index_rate}, Protect: {protect}")
     try:
         t0 = time.time()
         if speed >= 0:
             speed_str = f"+{speed}%"
@@ -151,6 +153,13 @@ def tts(
         audio, sr = librosa.load(edge_output_filename, sr=16000, mono=True)
         duration = len(audio) / sr
         print(f"Audio duration: {duration}s")
         f0_up_key = int(f0_up_key)
         tgt_sr, net_g, vc, version, index_file, if_f0 = model_data(model_name)
@@ -265,8 +274,7 @@ with app:
                 step=10,
                 interactive=True,
             )
-            tts_text = gr.Textbox(label="Input Text",
-                                  value="こんにちは、私の名前は初音ミクです!")
         with gr.Column():
             but0 = gr.Button("Convert", variant="primary")
             info_text = gr.Textbox(label="Output info")

 tts_voices = [f"{v['ShortName']}-{v['Gender']}" for v in tts_voice_list]
 # RVC models
+model_root = snapshot_download(repo_id="NoCrypt/miku_RVC", token=os.environ["TOKEN"])
+models = [d for d in os.listdir(model_root) if os.path.isdir(f"{model_root}/{d}")]
 models.sort()
     version = cpt.get("version", "v1")
     if version == "v1":
         if if_f0 == 1:
+            net_g = SynthesizerTrnMs256NSFsid(*cpt["config"], is_half=config.is_half)
         else:
             net_g = SynthesizerTrnMs256NSFsid_nono(*cpt["config"])
     elif version == "v2":
         if if_f0 == 1:
+            net_g = SynthesizerTrnMs768NSFsid(*cpt["config"], is_half=config.is_half)
         else:
             net_g = SynthesizerTrnMs768NSFsid_nono(*cpt["config"])
     else:
     print(tts_text)
     print(f"tts_voice: {tts_voice}, speed: {speed}")
     print(f"Model name: {model_name}")
+    print(f"F0: {f0_method}, Key: {f0_up_key}, Index: {index_rate}, Protect: {protect}")
     try:
+        if limitation and len(tts_text) > 1000:
+            print("Error: Text too long")
+            return (
+                f"Text characters should be at most 1000 in this huggingface space, but got {len(tts_text)} characters.",
+                None,
+                None,
+            )
         t0 = time.time()
         if speed >= 0:
             speed_str = f"+{speed}%"
         audio, sr = librosa.load(edge_output_filename, sr=16000, mono=True)
         duration = len(audio) / sr
         print(f"Audio duration: {duration}s")
+        if limitation and duration >= 200:
+            print("Error: Audio too long")
+            return (
+                f"Audio should be less than 200 seconds in this huggingface space, but got {duration}s.",
+                edge_output_filename,
+                None,
+            )
         f0_up_key = int(f0_up_key)
         tgt_sr, net_g, vc, version, index_file, if_f0 = model_data(model_name)
                 step=10,
                 interactive=True,
             )
+            tts_text = gr.Textbox(label="Input Text", value="こんにちは、私の名前は初音ミクです!")
         with gr.Column():
             but0 = gr.Button("Convert", variant="primary")
             info_text = gr.Textbox(label="Output info")