NoCrypt commited on
Commit
087c3c2
·
1 Parent(s): 3971395

added back limitation

Browse files
Files changed (1) hide show
  1. app.py +20 -12
app.py CHANGED
@@ -39,10 +39,8 @@ tts_voice_list = asyncio.get_event_loop().run_until_complete(edge_tts.list_voice
39
  tts_voices = [f"{v['ShortName']}-{v['Gender']}" for v in tts_voice_list]
40
 
41
  # RVC models
42
- model_root = snapshot_download(
43
- repo_id="NoCrypt/miku_RVC", token=os.environ["TOKEN"])
44
- models = [d for d in os.listdir(
45
- model_root) if os.path.isdir(f"{model_root}/{d}")]
46
  models.sort()
47
 
48
 
@@ -61,14 +59,12 @@ def model_data(model_name):
61
  version = cpt.get("version", "v1")
62
  if version == "v1":
63
  if if_f0 == 1:
64
- net_g = SynthesizerTrnMs256NSFsid(
65
- *cpt["config"], is_half=config.is_half)
66
  else:
67
  net_g = SynthesizerTrnMs256NSFsid_nono(*cpt["config"])
68
  elif version == "v2":
69
  if if_f0 == 1:
70
- net_g = SynthesizerTrnMs768NSFsid(
71
- *cpt["config"], is_half=config.is_half)
72
  else:
73
  net_g = SynthesizerTrnMs768NSFsid_nono(*cpt["config"])
74
  else:
@@ -133,9 +129,15 @@ def tts(
133
  print(tts_text)
134
  print(f"tts_voice: {tts_voice}, speed: {speed}")
135
  print(f"Model name: {model_name}")
136
- print(
137
- f"F0: {f0_method}, Key: {f0_up_key}, Index: {index_rate}, Protect: {protect}")
138
  try:
 
 
 
 
 
 
 
139
  t0 = time.time()
140
  if speed >= 0:
141
  speed_str = f"+{speed}%"
@@ -151,6 +153,13 @@ def tts(
151
  audio, sr = librosa.load(edge_output_filename, sr=16000, mono=True)
152
  duration = len(audio) / sr
153
  print(f"Audio duration: {duration}s")
 
 
 
 
 
 
 
154
  f0_up_key = int(f0_up_key)
155
 
156
  tgt_sr, net_g, vc, version, index_file, if_f0 = model_data(model_name)
@@ -265,8 +274,7 @@ with app:
265
  step=10,
266
  interactive=True,
267
  )
268
- tts_text = gr.Textbox(label="Input Text",
269
- value="こんにちは、私の名前は初音ミクです!")
270
  with gr.Column():
271
  but0 = gr.Button("Convert", variant="primary")
272
  info_text = gr.Textbox(label="Output info")
 
39
  tts_voices = [f"{v['ShortName']}-{v['Gender']}" for v in tts_voice_list]
40
 
41
  # RVC models
42
+ model_root = snapshot_download(repo_id="NoCrypt/miku_RVC", token=os.environ["TOKEN"])
43
+ models = [d for d in os.listdir(model_root) if os.path.isdir(f"{model_root}/{d}")]
 
 
44
  models.sort()
45
 
46
 
 
59
  version = cpt.get("version", "v1")
60
  if version == "v1":
61
  if if_f0 == 1:
62
+ net_g = SynthesizerTrnMs256NSFsid(*cpt["config"], is_half=config.is_half)
 
63
  else:
64
  net_g = SynthesizerTrnMs256NSFsid_nono(*cpt["config"])
65
  elif version == "v2":
66
  if if_f0 == 1:
67
+ net_g = SynthesizerTrnMs768NSFsid(*cpt["config"], is_half=config.is_half)
 
68
  else:
69
  net_g = SynthesizerTrnMs768NSFsid_nono(*cpt["config"])
70
  else:
 
129
  print(tts_text)
130
  print(f"tts_voice: {tts_voice}, speed: {speed}")
131
  print(f"Model name: {model_name}")
132
+ print(f"F0: {f0_method}, Key: {f0_up_key}, Index: {index_rate}, Protect: {protect}")
 
133
  try:
134
+ if limitation and len(tts_text) > 1000:
135
+ print("Error: Text too long")
136
+ return (
137
+ f"Text characters should be at most 1000 in this huggingface space, but got {len(tts_text)} characters.",
138
+ None,
139
+ None,
140
+ )
141
  t0 = time.time()
142
  if speed >= 0:
143
  speed_str = f"+{speed}%"
 
153
  audio, sr = librosa.load(edge_output_filename, sr=16000, mono=True)
154
  duration = len(audio) / sr
155
  print(f"Audio duration: {duration}s")
156
+ if limitation and duration >= 200:
157
+ print("Error: Audio too long")
158
+ return (
159
+ f"Audio should be less than 200 seconds in this huggingface space, but got {duration}s.",
160
+ edge_output_filename,
161
+ None,
162
+ )
163
  f0_up_key = int(f0_up_key)
164
 
165
  tgt_sr, net_g, vc, version, index_file, if_f0 = model_data(model_name)
 
274
  step=10,
275
  interactive=True,
276
  )
277
+ tts_text = gr.Textbox(label="Input Text", value="こんにちは、私の名前は初音ミクです!")
 
278
  with gr.Column():
279
  but0 = gr.Button("Convert", variant="primary")
280
  info_text = gr.Textbox(label="Output info")