Spaces:
Running
Running
# -*- coding: utf-8 -*- | |
from ttsmms import TTS | |
import gradio as gr | |
ISO_CODES = {'Tachelhit': 'shi', | |
'Tarifit (Latin script)': 'rif-script_latin', | |
'Tarifit (Arabic script)': 'rif-script_arabic', | |
'Taqbaylit': 'kab', | |
'Tamasheq': 'taq', | |
'Tamajaq, Tawallammat (Tifinagh script)': 'ttq-script_tifinagh' | |
} | |
mapping = {'ɣ': 'ġ', | |
'v': 'ġ', | |
'c': 'š', | |
'x': 'ḫ', | |
'T': 'ṭ', | |
'S': 'ṣ', | |
'D': 'ḍ', | |
'H': 'ḥ', | |
'Z': 'ẓ', | |
'3': 'ε', | |
'7': 'ḥ', | |
'9': 'q', | |
'gh': 'ġ', | |
'kh': 'ḫ' | |
} | |
MODELS = {} | |
def tts(text, variant): | |
variant_code = ISO_CODES[variant] | |
if variant_code not in MODELS: | |
MODELS[variant_code] = TTS(variant_code) | |
model = MODELS[variant_code] | |
if variant_code == 'shi': | |
for key, value in mapping.items(): | |
text = text.replace(key, value) | |
audio = model.synthesis(text) | |
return (audio['sampling_rate'], audio['x']) | |
examples = [["Riɣ ad cceɣ s ufus kḍuɣ s inxar", "Tachelhit"], | |
["arraw n lhem yukr aɣ ihdumn nɣ", "Tachelhit"], | |
["wa tamɣart ma d ukan teskart ?", "Tachelhit"], | |
["ar d iṭṭar unẓar, ffuɣn d igḍaḍ, mmɣin d ijjign", "Tachelhit"], | |
["Egg lxir di timura, ad tafed di tiwwura.", "Tarifit (Latin script)"], | |
["Aqemmum iqnen ur ṯ-ttidfen izan.", "Tarifit (Latin script)"]] | |
description = "Text-to-speech for Tachelhit, Tarifit, Taqbaylit, Tamasheq and Tamajaq (Tawallammat)." | |
iface = gr.Interface( | |
fn=tts, | |
inputs=[ | |
gr.Textbox( | |
label="Text", | |
default="Text to synthesize.", | |
), | |
gr.Dropdown(label="Variant", choices=list(ISO_CODES.keys()), value="Tachelhit") | |
], | |
outputs=gr.Audio(label="Output", type="numpy"), | |
examples=examples, | |
title="🗣️ Tamazight Text-to-Speech with MMS (Massively Multilingual Speech) 🗣️", | |
description=description, | |
allow_flagging="manual", | |
flagging_options=['error', 'bad-quality', 'wrong-pronounciation'], | |
) | |
iface.launch() |