[dataset] Support aishell3 (tested)

This commit is contained in:
Nemo 2021-08-25 23:11:29 +08:00
parent 3084fdeb10
commit 0cc3f569fa
2 changed files with 6 additions and 0 deletions

View File

@@ -19,6 +19,11 @@ data_info = {
"trans_filepath": "train/TRANS.txt",
"speak_func": preprocess_speaker_general
},
"aishell3":{
"subfolders": ["train/wav"],
"trans_filepath": "train/content.txt",
"speak_func": preprocess_speaker_general
},
}
def preprocess_dataset(datasets_root: Path, out_dir: Path, n_processes: int,

View File

@@ -8,6 +8,7 @@ import argparse
recognized_datasets = [
"aidatatang_200zh",
"magicdata",
"aishell3"
]
if __name__ == "__main__":