mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-08 17:42:21 +00:00
[egs] Add prefix when reading manifests due to recent lhotse changes (#382)
* [egs] Add prefix when reading manifests due to recent lhotse changes
* Fix wenetspeech
* Fix style issues
This commit is contained in:
parent
0e57b30495
commit
8c5722de8c
@ -53,7 +53,7 @@ def compute_fbank_aishell(num_mel_bins: int = 80):
|
|||||||
"test",
|
"test",
|
||||||
)
|
)
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts, output_dir=src_dir
|
prefix="aishell", dataset_parts=dataset_parts, output_dir=src_dir
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
@ -35,8 +35,7 @@ def preprocess_aidatatang_200zh():
|
|||||||
|
|
||||||
logging.info("Loading manifest")
|
logging.info("Loading manifest")
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts,
|
dataset_parts=dataset_parts, output_dir=src_dir, prefix="aidatatang"
|
||||||
output_dir=src_dir,
|
|
||||||
)
|
)
|
||||||
assert len(manifests) > 0
|
assert len(manifests) > 0
|
||||||
|
|
||||||
|
@ -53,7 +53,7 @@ def compute_fbank_musan():
|
|||||||
)
|
)
|
||||||
|
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts, output_dir=src_dir
|
prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
@ -57,7 +57,7 @@ def compute_fbank_librispeech():
|
|||||||
"train-other-500",
|
"train-other-500",
|
||||||
)
|
)
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts, output_dir=src_dir
|
prefix="librispeech", dataset_parts=dataset_parts, output_dir=src_dir
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
@ -53,7 +53,7 @@ def compute_fbank_musan():
|
|||||||
"noise",
|
"noise",
|
||||||
)
|
)
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts, output_dir=src_dir
|
prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
@ -65,7 +65,7 @@ def compute_fbank_musan():
|
|||||||
"noise",
|
"noise",
|
||||||
)
|
)
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts, output_dir=src_dir
|
prefix="musan", dataset_parts=dataset_parts, output_dir=src_dir
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
@ -53,7 +53,7 @@ def compute_fbank_tedlium():
|
|||||||
)
|
)
|
||||||
|
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts, output_dir=src_dir
|
prefix="tedlium", dataset_parts=dataset_parts, output_dir=src_dir
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
@ -54,7 +54,7 @@ def compute_fbank_timit():
|
|||||||
"TEST",
|
"TEST",
|
||||||
)
|
)
|
||||||
manifests = read_manifests_if_cached(
|
manifests = read_manifests_if_cached(
|
||||||
dataset_parts=dataset_parts, output_dir=src_dir
|
prefix="timit", dataset_parts=dataset_parts, output_dir=src_dir
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
@ -62,6 +62,7 @@ def preprocess_wenet_speech():
|
|||||||
dataset_parts=dataset_parts,
|
dataset_parts=dataset_parts,
|
||||||
output_dir=src_dir,
|
output_dir=src_dir,
|
||||||
suffix="jsonl.gz",
|
suffix="jsonl.gz",
|
||||||
|
prefix="wenetspeech",
|
||||||
)
|
)
|
||||||
assert manifests is not None
|
assert manifests is not None
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user