This commit is contained in:
zr_jin 2023-07-19 11:51:40 +08:00
parent 441aa37e00
commit c061307c90
2 changed files with 3 additions and 3 deletions

View File

@@ -47,7 +47,7 @@ def get_parser():
parser.add_argument(
"--training-subset",
type=str,
-default="L",
+default="train_phase1",
help="The training subset for computing fbank feature.",
)
@@ -93,7 +93,7 @@ def compute_fbank_kespeech_splits(args):
subset = args.training_subset
subset = str(subset)
num_splits = args.num_splits
-output_dir = f"data/fbank/{subset}_split_{num_splits}"
+output_dir = f"data/fbank/KeSpeech/{subset}_split_{num_splits}"
output_dir = Path(output_dir)
assert output_dir.exists(), f"{output_dir} does not exist!"

View File

@@ -47,7 +47,7 @@ def has_no_oov(
def preprocess_kespeech():
src_dir = Path("data/manifests/KeSpeech")
-output_dir = Path("data/fbank")
+output_dir = Path("data/fbank/KeSpeech")
output_dir.mkdir(exist_ok=True)
# Note: By default, we preprocess all sub-parts.