File size: 677 Bytes
98f685a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
import os

from data_gen.tts.base_pre_align import BasePreAlign
import glob


class VCTKPreAlign(BasePreAlign):
    def meta_data(self):
        wav_fns = glob.glob(f'{self.raw_data_dir}/wav48/*/*.wav')
        for wav_fn in wav_fns:
            item_name = os.path.basename(wav_fn)[:-4]
            spk = item_name.split("_")[0]
            txt_fn = wav_fn.split("/")
            txt_fn[-1] = f'{item_name}.txt'
            txt_fn[-3] = f'txt'
            txt_fn = "/".join(txt_fn)
            if os.path.exists(txt_fn) and os.path.exists(wav_fn):
                yield item_name, wav_fn, (self.load_txt, txt_fn), spk


if __name__ == "__main__":
    VCTKPreAlign().process()