Mirror of https://github.com/k2-fsa/icefall.git (synced 2025-08-08 09:32:20 +00:00)
[egs] Add prefix when reading manifests due to recent lhotse changes (#382)
* [egs] Add prefix when reading manifests due to recent lhotse changes
* Fix wenetspeech
* Fix style issues
This commit is contained in:
parent 0e57b30495
commit 8c5722de8c
@@ -53,7 +53,7 @@ def compute_fbank_aishell(num_mel_bins: int = 80):
         "test",
     )
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts, output_dir=src_dir
+        prefix="aishell", dataset_parts=dataset_parts, output_dir=src_dir
     )
     assert manifests is not None
 
@@ -35,8 +35,7 @@ def preprocess_aidatatang_200zh():
 
     logging.info("Loading manifest")
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts,
-        output_dir=src_dir,
+        dataset_parts=dataset_parts, output_dir=src_dir, prefix="aidatatang"
     )
     assert len(manifests) > 0
 
@@ -53,7 +53,7 @@ def compute_fbank_musan():
     )
 
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts, output_dir=src_dir
+        prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
     )
     assert manifests is not None
 
@@ -57,7 +57,7 @@ def compute_fbank_librispeech():
         "train-other-500",
     )
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts, output_dir=src_dir
+        prefix="librispeech", dataset_parts=dataset_parts, output_dir=src_dir
     )
     assert manifests is not None
 
@@ -53,7 +53,7 @@ def compute_fbank_musan():
         "noise",
     )
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts, output_dir=src_dir
+        prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
     )
     assert manifests is not None
 
@@ -65,7 +65,7 @@ def compute_fbank_musan():
         "noise",
     )
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts, output_dir=src_dir
+        prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
     )
     assert manifests is not None
 
@@ -53,7 +53,7 @@ def compute_fbank_tedlium():
     )
 
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts, output_dir=src_dir
+        prefix="tedlium", dataset_parts=dataset_parts, output_dir=src_dir
     )
     assert manifests is not None
 
@@ -54,7 +54,7 @@ def compute_fbank_timit():
         "TEST",
     )
     manifests = read_manifests_if_cached(
-        dataset_parts=dataset_parts, output_dir=src_dir
+        prefix="timit", dataset_parts=dataset_parts, output_dir=src_dir
     )
     assert manifests is not None
 
@@ -62,6 +62,7 @@ def preprocess_wenet_speech():
         dataset_parts=dataset_parts,
         output_dir=src_dir,
         suffix="jsonl.gz",
+        prefix="wenetspeech",
     )
     assert manifests is not None
 
Loading…
x
Reference in New Issue
Block a user