mirror of
https://github.com/k2-fsa/icefall.git
synced 2025-08-09 01:52:41 +00:00
Update train.py (#773)
Fix transducer lstm egs bug as mentioned in issue 579
This commit is contained in:
parent
070c77e724
commit
7eb2d0edb6
@ -629,18 +629,8 @@ def run(rank, world_size, args):
|
|||||||
# Keep only utterances with duration between 1 second and 20 seconds
|
# Keep only utterances with duration between 1 second and 20 seconds
|
||||||
return 1.0 <= c.duration <= 20.0
|
return 1.0 <= c.duration <= 20.0
|
||||||
|
|
||||||
num_in_total = len(train_cuts)
|
|
||||||
|
|
||||||
train_cuts = train_cuts.filter(remove_short_and_long_utt)
|
train_cuts = train_cuts.filter(remove_short_and_long_utt)
|
||||||
|
|
||||||
num_left = len(train_cuts)
|
|
||||||
num_removed = num_in_total - num_left
|
|
||||||
removed_percent = num_removed / num_in_total * 100
|
|
||||||
|
|
||||||
logging.info(f"Before removing short and long utterances: {num_in_total}")
|
|
||||||
logging.info(f"After removing short and long utterances: {num_left}")
|
|
||||||
logging.info(f"Removed {num_removed} utterances ({removed_percent:.5f}%)")
|
|
||||||
|
|
||||||
train_dl = librispeech.train_dataloaders(train_cuts)
|
train_dl = librispeech.train_dataloaders(train_cuts)
|
||||||
|
|
||||||
valid_cuts = librispeech.dev_clean_cuts()
|
valid_cuts = librispeech.dev_clean_cuts()
|
||||||
|
Loading…
x
Reference in New Issue
Block a user