Update egs/librispeech/ASR/pruned_transducer_stateless6/hubert_xlarge.py

Co-authored-by: Fangjun Kuang <csukuangfj@gmail.com>
This commit is contained in:
LIyong.Guo 2022-05-27 11:23:43 +08:00 committed by GitHub
parent 91432397cf
commit 6fff82b917
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -178,9 +178,7 @@ class HubertXlargeFineTuned:
N = encoder_embedding.shape[0]
assert len(cut_list) == N
# 320 is from: 16,000 / 50 = sample_rate / HuBERT output frame rate
num_frames = [
supervisions["num_samples"][i].item() // 320 for i in range(N)
]
num_frames = (supervisions["num_samples"] // 320).tolist()
return encoder_embedding, num_frames
def ctc_greedy_search(self, batch):