From 28bd9330d7a229dc8d7acd7054662edf9c50cbb6 Mon Sep 17 00:00:00 2001 From: zr_jin Date: Tue, 22 Oct 2024 22:05:49 +0800 Subject: [PATCH] minor fixes --- egs/tokenizer/CODEC/encodec/codec_datamodule.py | 2 +- egs/tokenizer/CODEC/encodec/loss.py | 5 ++--- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/egs/tokenizer/CODEC/encodec/codec_datamodule.py b/egs/tokenizer/CODEC/encodec/codec_datamodule.py index 6f4661995..5de39678a 100644 --- a/egs/tokenizer/CODEC/encodec/codec_datamodule.py +++ b/egs/tokenizer/CODEC/encodec/codec_datamodule.py @@ -143,7 +143,7 @@ class CodecDataModule: group.add_argument( "--input-strategy", type=str, - default="PrecomputedFeatures", + default="AudioSamples", help="AudioSamples or PrecomputedFeatures", ) diff --git a/egs/tokenizer/CODEC/encodec/loss.py b/egs/tokenizer/CODEC/encodec/loss.py index c6351ec65..9f0558569 100644 --- a/egs/tokenizer/CODEC/encodec/loss.py +++ b/egs/tokenizer/CODEC/encodec/loss.py @@ -300,13 +300,12 @@ class SpectrogramReconstructionLoss(torch.nn.Module): def __init__( self, - sampling_rate: int = 22050, return_spec: bool = False, ): super().__init__() self.wav_to_specs = [] - for i in range(5, 10): - s = 2**i // 8 + for i in range(5, 12): + s = 2**i self.wav_to_specs.append( Spectrogram( n_fft=s,