mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-09 10:02:22 +00:00
optimize with num_jobs on save_audios
This commit is contained in:
parent
88249f0eb4
commit
547f5c5cfb
@ -120,6 +120,11 @@ def main():
|
|||||||
cut_sets = make_cutset_blueprints(mls_eng_hf_dataset_path)
|
cut_sets = make_cutset_blueprints(mls_eng_hf_dataset_path)
|
||||||
for part, cut_set in cut_sets:
|
for part, cut_set in cut_sets:
|
||||||
logging.info(f"Processing {part}")
|
logging.info(f"Processing {part}")
|
||||||
|
cut_set = cut_set.save_audios(
|
||||||
|
num_jobs=num_jobs,
|
||||||
|
storage_path=(args.audio_dir / part).as_posix(),
|
||||||
|
) # makes new cutset that loads audio from paths to actual audio files
|
||||||
|
|
||||||
cut_set = cut_set.compute_and_store_features(
|
cut_set = cut_set.compute_and_store_features(
|
||||||
extractor=extractor,
|
extractor=extractor,
|
||||||
num_jobs=num_jobs,
|
num_jobs=num_jobs,
|
||||||
@ -127,7 +132,6 @@ def main():
|
|||||||
storage_type=LilcomChunkyWriter,
|
storage_type=LilcomChunkyWriter,
|
||||||
)
|
)
|
||||||
|
|
||||||
cut_set = cut_set.save_audios(args.audio_dir / part) # makes new cutset that uses paths to actual audio files
|
|
||||||
cut_set.to_file(args.manifest_dir / f"mls_eng_cuts_{part}.jsonl.gz")
|
cut_set.to_file(args.manifest_dir / f"mls_eng_cuts_{part}.jsonl.gz")
|
||||||
|
|
||||||
logging.info("All fbank computed for MLS English.")
|
logging.info("All fbank computed for MLS English.")
|
||||||
|
Loading…
x
Reference in New Issue
Block a user