diff --git a/egs/librispeech/ASR/local/.prepare_vox.py.swp b/egs/librispeech/ASR/local/.prepare_vox.py.swp index cce5c3800..0917789fb 100644 Binary files a/egs/librispeech/ASR/local/.prepare_vox.py.swp and b/egs/librispeech/ASR/local/.prepare_vox.py.swp differ diff --git a/egs/librispeech/ASR/local/prepare_vox.py b/egs/librispeech/ASR/local/prepare_vox.py index d956a61b5..ff1375758 100755 --- a/egs/librispeech/ASR/local/prepare_vox.py +++ b/egs/librispeech/ASR/local/prepare_vox.py @@ -59,10 +59,9 @@ def prepare_vox( # ) manifests = {} - subset = spk_id.split('_')[0] - spk_idx = spk_id.split('_')[1] + #dataset_parts = ["train", "dev", "test"] - dataset_parts = [spk_idx] + dataset_parts = [spk_id] if output_dir is not None: output_dir = Path(output_dir) output_dir.mkdir(parents=True, exist_ok=True) @@ -82,8 +81,7 @@ def prepare_vox( #part_file_names = list(map(lambda x: x.strip('.wav'), os.listdir(part_path))) part_file_names = sorted(glob.glob(str(part_path)+'/*.wav')) part_file_names = [name.split('/')[-1].replace('.wav', '') for name in part_file_names] - txt_path = os.path.join(corpus_dir, f"../{spk_idx}_texts") - print(txt_path) + txt_path = os.path.join(corpus_dir, f"../{spk_id}/texts") futures = [] for trans_path in tqdm(