@ -19,6 +19,11 @@ data_info = {
"trans_filepath": "train/TRANS.txt",
"speak_func": preprocess_speaker_general
},
"aishell3":{
"subfolders": ["train/wav"],
"trans_filepath": "train/content.txt",
}
def preprocess_dataset(datasets_root: Path, out_dir: Path, n_processes: int,
@ -8,6 +8,7 @@ import argparse
# Names of the datasets this module lists as recognized.
# NOTE(review): the code that consumes this list is outside the visible
# chunk -- presumably it validates a dataset-name argument; confirm.
recognized_datasets = [
    "aidatatang_200zh",
    "magicdata",
    "aishell3",
]
if __name__ == "__main__":