NeuML
/

ljspeech-vits-onnx

Model card Files Files and versions Community

davidmezzetti committed on Nov 29, 2022

Commit

d51b59a

•

1 Parent(s): db21534

Add model files

Files changed (3) hide show

README.md +30 -0
config.yaml +92 -0
model.onnx +3 -0

README.md CHANGED Viewed

@@ -1,3 +1,33 @@
 ---
 license: apache-2.0
 ---

 ---
+tags:
+- audio
+- text-to-speech
+- onnx
+inference: false
+language: en
+datasets:
+- ljspeech
 license: apache-2.0
 ---
+# ESPnet VITS Text-to-Speech (TTS) Model for ONNX
+This model is an ONNX export of [espnet/kan-bayashi_ljspeech_vits](https://huggingface.co/espnet/kan-bayashi_ljspeech_vits), created using the [espnet_onnx](https://github.com/espnet/espnet_onnx) library.
+## Usage with txtai
+txtai has a built-in Text to Speech (TTS) pipeline that makes using this model easy.
+```python
+```
+## Usage with ONNX
+This model can also be run directly with ONNX, provided the input text is tokenized. Tokenization can be done with [ttstokenizer](https://github.com/neuml/ttstokenizer).
+```python
+```
+## How to export
+More information on how to export ESPnet models to ONNX can be [found here](https://github.com/espnet/espnet_onnx#text2speech-inference).

config.yaml ADDED Viewed

	@@ -0,0 +1,92 @@

+normalize:
+  use_normalize: false
+text_cleaner:
+  cleaner_types: tacotron
+token:
+  list:
+  - <blank>
+  - <unk>
+  - AH0
+  - N
+  - T
+  - D
+  - S
+  - R
+  - L
+  - DH
+  - K
+  - Z
+  - IH1
+  - IH0
+  - M
+  - EH1
+  - W
+  - P
+  - AE1
+  - AH1
+  - V
+  - ER0
+  - F
+  - ','
+  - AA1
+  - B
+  - HH
+  - IY1
+  - UW1
+  - IY0
+  - AO1
+  - EY1
+  - AY1
+  - .
+  - OW1
+  - SH
+  - NG
+  - G
+  - ER1
+  - CH
+  - JH
+  - Y
+  - AW1
+  - TH
+  - UH1
+  - EH2
+  - OW0
+  - EY2
+  - AO0
+  - IH2
+  - AE2
+  - AY2
+  - AA2
+  - UW0
+  - EH0
+  - OY1
+  - EY0
+  - AO2
+  - ZH
+  - OW2
+  - AE0
+  - UW2
+  - AH2
+  - AY0
+  - IY2
+  - AW2
+  - AA0
+  - ''''
+  - ER2
+  - UH2
+  - '?'
+  - OY2
+  - '!'
+  - AW0
+  - UH0
+  - OY0
+  - ..
+  - <sos/eos>
+tokenizer:
+  g2p_type: g2p_en_no_space
+  token_type: phn
+tts_model:
+  model_path: espnet/kan-bayashi_ljspeech_vits/full/vits.onnx
+  model_type: VITS
+vocoder:
+  vocoder_type: not_used

model.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6d18b3b99099fcad3bf5b5c02cbc98f262483a72699a9e995833fffbdc445053
+size 137938668