@@ -10,18 +10,18 @@ def get_text(path_to_script_file):
1010 return text
1111
1212
def make(root='data', name='vlsp2020_train_set_02', save='LJSpeech-1.1'):
    """Rearrange a flat folder of wav/txt pairs into a wavs/ + metadata.csv layout.

    Every ``*.wav`` file found in ``<root>/<name>`` is moved (not copied) into
    ``<root>/<save>/wavs``. For every ``*.txt`` file in ``<root>/<name>`` one
    row is written to ``<root>/<save>/metadata.csv`` using ``|`` as delimiter:
    the file name without its extension, followed by the text returned by
    ``get_text`` twice.

    Args:
        root: Directory that contains both the source and the target folder.
        name: Sub-folder of ``root`` holding the source ``.wav``/``.txt`` files.
        save: Sub-folder of ``root`` that receives ``wavs/`` and
            ``metadata.csv``. It is created if missing.

    Raises:
        OSError: If a wav file cannot be moved or the metadata file cannot be
            written.
    """
    target_dir = os.path.join(root, save)
    wav_dir = os.path.join(target_dir, 'wavs')
    # makedirs also creates <root>/<save> itself; plain mkdir would fail when
    # the parent folder does not exist yet.
    os.makedirs(wav_dir, exist_ok=True)

    # glob returns paths in arbitrary order; sort so that metadata.csv is
    # reproducible between runs and machines.
    all_audio_file_paths = sorted(glob.glob(os.path.join(root, name, "*.wav")))
    all_script_file_paths = sorted(glob.glob(os.path.join(root, name, "*.txt")))

    for audio_file in tqdm(all_audio_file_paths):
        # basename honours the platform's path separator, unlike splitting on
        # a hard-coded '/' or '\\'.
        file_name = os.path.basename(audio_file)
        os.rename(audio_file, os.path.join(wav_dir, file_name))

    metadata_path = os.path.join(target_dir, 'metadata.csv')
    with open(metadata_path, 'w', encoding='UTF8', newline='') as f:
        writer = csv.writer(f, delimiter="|")
        for text_file in tqdm(all_script_file_paths):
            # splitext removes only the final extension, so an id such as
            # "spk.001" stays intact and still matches "spk.001.wav".
            file_name = os.path.splitext(os.path.basename(text_file))[0]
            text = get_text(text_file)
            # The same text fills both text columns.
            # NOTE(review): presumably the raw and normalized transcript
            # columns of the LJSpeech metadata format - confirm.
            writer.writerow([file_name, text, text])
0 commit comments