Reformatted streaming_decode.py with flake8

Bailey Hirota 2025-01-15 01:11:29 +09:00
parent b574e68bf4
commit 9ab3021640

streaming_decode.py

@@ -22,13 +22,14 @@ Usage:
 """
-import pdb
 import argparse
 import logging
 import math
+import os
+import pdb
+import subprocess as sp
 from pathlib import Path
 from typing import Dict, List, Optional, Tuple
-from tokenizer import Tokenizer

 import k2
 import numpy as np
@@ -42,6 +43,7 @@ from streaming_beam_search import (
     greedy_search,
     modified_beam_search,
 )
+from tokenizer import Tokenizer
 from torch import Tensor, nn
 from torch.nn.utils.rnn import pad_sequence
 from train import add_model_arguments, get_model, get_params
@@ -61,9 +63,6 @@ from icefall.utils import (
     write_error_stats,
 )
-import subprocess as sp
-import os

 LOG_EPS = math.log(1e-10)
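
Note on the import moves above: this commit aliases subprocess as `sp` at module scope, which would collide with the tokenizer that the old code also called `sp`; the hunks below therefore rename the tokenizer parameter to `tokenizer` and the local variable to `sp_token`. A minimal sketch of the shadowing hazard, with illustrative names not taken from this file:

    import subprocess as sp

    def decode(sp) -> None:
        # The parameter shadows the module-level alias, so inside this
        # function `sp` is the tokenizer object and the call fails:
        sp.run(["echo", "ok"])  # AttributeError on a tokenizer

    def decode_renamed(tokenizer) -> None:
        # With the parameter renamed, `sp` is unambiguously subprocess:
        sp.run(["echo", "ok"])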
@@ -124,7 +123,7 @@ def get_parser():
         default="data/lang_bpe_500/bpe.model",
         help="Path to the BPE model",
     )

     parser.add_argument(
         "--lang-dir",
         type=Path,
@@ -449,14 +448,14 @@ def decode_one_chunk(
     feature_lens = []
     states = []
     processed_lens = []  # Used in fast-beam-search

     for stream in decode_streams:
         feat, feat_len = stream.get_feature_frames(chunk_size * 2)
         features.append(feat)
         feature_lens.append(feat_len)
         states.append(stream.states)
         processed_lens.append(stream.done_frames)

     feature_lens = torch.tensor(feature_lens, device=model.device)
     features = pad_sequence(features, batch_first=True, padding_value=LOG_EPS)
@@ -518,9 +517,9 @@ def decode_one_chunk(
         decode_streams[i].states = states[i]
         decode_streams[i].done_frames += encoder_out_lens[i]
         # if decode_streams[i].done:
         #     finished_streams.append(i)
         finished_streams.append(i)

     return finished_streams
@@ -528,7 +527,7 @@ def decode_dataset(
     cuts: CutSet,
     params: AttributeDict,
     model: nn.Module,
-    sp: Tokenizer,
+    tokenizer: Tokenizer,
     decoding_graph: Optional[k2.Fsa] = None,
 ) -> Dict[str, List[Tuple[List[str], List[str]]]]:
     """Decode dataset.
@@ -540,7 +539,7 @@ def decode_dataset(
         It is returned by :func:`get_params`.
       model:
         The neural model.
-      sp:
+      tokenizer:
         The BPE model.
       decoding_graph:
         The decoding graph. Can be either a `k2.trivial_graph` or HLG, Used
@@ -608,7 +607,7 @@ def decode_dataset(
                 (
                     decode_streams[i].id,
                     decode_streams[i].ground_truth.split(),
-                    sp.decode(decode_streams[i].decoding_result()).split(),
+                    tokenizer.decode(decode_streams[i].decoding_result()).split(),
                 )
             )
             del decode_streams[i]
@@ -628,21 +627,20 @@ def decode_dataset(
         )
         # print('INSIDE FOR LOOP ')
         # print(finished_streams)

         if not finished_streams:
             print("No finished streams, breaking the loop")
             break

         for i in sorted(finished_streams, reverse=True):
             try:
                 decode_results.append(
                     (
                         decode_streams[i].id,
                         decode_streams[i].ground_truth.split(),
-                        sp.decode(decode_streams[i].decoding_result()).split(),
+                        tokenizer.decode(decode_streams[i].decoding_result()).split(),
                     )
                 )
                 del decode_streams[i]
             except IndexError as e:
                 print(f"IndexError: {e}")
@@ -650,7 +648,7 @@ def decode_dataset(
                 print(f"finished_streams: {finished_streams}")
                 print(f"i: {i}")
                 continue

     if params.decoding_method == "greedy_search":
         key = "greedy_search"
     elif params.decoding_method == "fast_beam_search":
@@ -663,7 +661,7 @@ def decode_dataset(
         key = f"num_active_paths_{params.num_active_paths}"
     else:
         raise ValueError(f"Unsupported decoding method: {params.decoding_method}")

     torch.cuda.synchronize()
     return {key: decode_results}
@@ -755,12 +753,12 @@ def main():
     logging.info(f"Device: {device}")

-    sp = Tokenizer.load(params.lang, params.lang_type)
+    sp_token = Tokenizer.load(params.lang, params.lang_type)

     # <blk> and <unk> is defined in local/train_bpe_model.py
-    params.blank_id = sp.piece_to_id("<blk>")
-    params.unk_id = sp.piece_to_id("<unk>")
-    params.vocab_size = sp.get_piece_size()
+    params.blank_id = sp_token.piece_to_id("<blk>")
+    params.unk_id = sp_token.piece_to_id("<unk>")
+    params.vocab_size = sp_token.get_piece_size()

     logging.info(params)
@@ -854,11 +852,11 @@ def main():
     num_param = sum([p.numel() for p in model.parameters()])
     logging.info(f"Number of model parameters: {num_param}")

     # we need cut ids to display recognition results.
     args.return_cuts = True
     reazonspeech_corpus = ReazonSpeechAsrDataModule(args)

     valid_cuts = reazonspeech_corpus.valid_cuts()
     test_cuts = reazonspeech_corpus.test_cuts()
@@ -870,7 +868,7 @@ def main():
             cuts=test_cut,
             params=params,
             model=model,
-            sp=sp,
+            tokenizer=sp_token,
             decoding_graph=decoding_graph,
         )
         save_results(
@@ -878,9 +876,9 @@ def main():
             test_set_name=test_set,
             results_dict=results_dict,
         )

     # valid_cuts = reazonspeech_corpus.valid_cuts()
     # for valid_cut in valid_cuts:
     #     results_dict = decode_dataset(
     #         cuts=valid_cut,
@@ -894,7 +892,7 @@ def main():
     #         test_set_name="valid",
     #         results_dict=results_dict,
     #     )

     logging.info("Done!")