Spaces:

m6011
/

Najdi_TTS_Project

Build error

m6011 committed on Sep 13

Commit

c3cb969

•

1 Parent(s): 8a1a95a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,26 +1,39 @@
 import gradio as gr
 from espnet2.bin.tts_inference import Text2Speech
-from transformers import AutoTokenizer, AutoModel
-# تحميل SaudiBERT لتحليل النص
-tokenizer = AutoTokenizer.from_pretrained("faisalq/SaudiBERT")
-model = AutoModel.from_pretrained("faisalq/SaudiBERT")
-# تحميل نموذج FastSpeech2
-tts = Text2Speech.from_pretrained("kan-bayashi/fastspeech2")
-# دالة لتحليل النص باستخدام SaudiBERT
-def analyze_text(text):
-    inputs = tokenizer(text, return_tensors="pt")
-    outputs = model(**inputs)
-    return text  # إعادة النص للتحويل بعد التحليل
 # دالة لتحويل النص إلى كلام
 def tts_najdi(text):
-    processed_text = analyze_text(text)
-    speech = tts(processed_text)
-    return speech['wav']
 # واجهة Gradio
-iface = gr.Interface(fn=tts_najdi, inputs="text", outputs="audio", title="FastSpeech2 Najdi TTS Model with SaudiBERT")
 iface.launch()

+# app.py
 import gradio as gr
+import torch
 from espnet2.bin.tts_inference import Text2Speech
+from espnet_model_zoo.downloader import ModelDownloader
+from transformers import AutoTokenizer
+# تحميل قائمة التوكينات
+with open('tokens.txt', 'r', encoding='utf-8') as f:
+    token_list = [line.strip() for line in f]
+# تحميل النموذج المدرب
+model_path = 'exp/tts_fastspeech2/train.total_count.ave_10best.pth'  # تأكد من مسار النموذج الصحيح
+config_path = 'exp/tts_fastspeech2/config.yaml'
+# إعداد Text2Speech
+device = 'cuda' if torch.cuda.is_available() else 'cpu'
+text2speech = Text2Speech.from_pretrained(
+    model_file=model_path,
+    config_file=config_path,
+    device=device,
+    threshold=0.5,
+    maxlenratio=10.0,
+    minlenratio=0.0,
+    use_att_constraint=False,
+    backward_window=1,
+    forward_window=3,
+)
 # دالة لتحويل النص إلى كلام
 def tts_najdi(text):
+    with torch.no_grad():
+        wav = text2speech(text)["wav"]
+    return wav.view(-1).cpu().numpy(), 22050  # تأكد من استخدام معدل العينة الصحيح
 # واجهة Gradio
+iface = gr.Interface(fn=tts_najdi, inputs="text", outputs="audio", title="Najdi TTS Model")
 iface.launch()