[egs] Add prefix when reading manifests due to recent lhotse changes (#382)

* [egs] Add prefix when reading manifests due to recent lhotse changes

* Fix wenetspeech

* Fix style issues
This commit is contained in:
Ewald Enzinger 2022-05-23 17:37:35 +02:00 committed by GitHub
parent 0e57b30495
commit 8c5722de8c
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
9 changed files with 9 additions and 9 deletions

View File

@@ -53,7 +53,7 @@ def compute_fbank_aishell(num_mel_bins: int = 80):
"test",
)
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts, output_dir=src_dir
+prefix="aishell", dataset_parts=dataset_parts, output_dir=src_dir
)
assert manifests is not None

View File

@@ -35,8 +35,7 @@ def preprocess_aidatatang_200zh():
logging.info("Loading manifest")
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts,
-output_dir=src_dir,
+dataset_parts=dataset_parts, output_dir=src_dir, prefix="aidatatang"
)
assert len(manifests) > 0

View File

@@ -53,7 +53,7 @@ def compute_fbank_musan():
)
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts, output_dir=src_dir
+prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
)
assert manifests is not None

View File

@@ -57,7 +57,7 @@ def compute_fbank_librispeech():
"train-other-500",
)
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts, output_dir=src_dir
+prefix="librispeech", dataset_parts=dataset_parts, output_dir=src_dir
)
assert manifests is not None

View File

@@ -53,7 +53,7 @@ def compute_fbank_musan():
"noise",
)
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts, output_dir=src_dir
+prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
)
assert manifests is not None

View File

@@ -65,7 +65,7 @@ def compute_fbank_musan():
"noise",
)
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts, output_dir=src_dir
+prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
)
assert manifests is not None

View File

@@ -53,7 +53,7 @@ def compute_fbank_tedlium():
)
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts, output_dir=src_dir
+prefix="tedlium", dataset_parts=dataset_parts, output_dir=src_dir
)
assert manifests is not None

View File

@@ -54,7 +54,7 @@ def compute_fbank_timit():
"TEST",
)
manifests = read_manifests_if_cached(
-dataset_parts=dataset_parts, output_dir=src_dir
+prefix="timit", dataset_parts=dataset_parts, output_dir=src_dir
)
assert manifests is not None

View File

@@ -62,6 +62,7 @@ def preprocess_wenet_speech():
dataset_parts=dataset_parts,
output_dir=src_dir,
suffix="jsonl.gz",
+prefix="wenetspeech",
)
assert manifests is not None