Skip to content

Commit

Permalink
add assert and comment to lightning module
Browse files Browse the repository at this point in the history
  • Loading branch information
hwangjeff committed Apr 13, 2022
1 parent 854ece9 commit da751eb
Showing 1 changed file with 13 additions and 2 deletions.
15 changes: 13 additions & 2 deletions examples/asr/librispeech_conformer_rnnt/lightning.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,8 @@

# Mel spectrogram transform shared by this module: 16 kHz input audio,
# 400-point FFT, 160-sample hop, 80 mel bins.
_spectrogram_transform = torchaudio.transforms.MelSpectrogram(
    sample_rate=16000,
    n_fft=400,
    n_mels=80,
    hop_length=160,
)

# SentencePiece vocabulary size that the model returned by
# ``conformer_rnnt_base`` expects; the module's ``__init__`` asserts that the
# supplied SentencePiece model matches it.
_expected_spm_vocab_size = 1023


def _piecewise_linear_log(x):
x[x > math.e] = torch.log(x[x > math.e])
Expand Down Expand Up @@ -195,6 +197,17 @@ def __init__(
):
super().__init__()

self.sp_model = spm.SentencePieceProcessor(model_file=sp_model_path)
spm_vocab_size = self.sp_model.get_piece_size()
assert spm_vocab_size == _expected_spm_vocab_size, (
"The model returned by conformer_rnnt_base expects a SentencePiece model of "
f"vocabulary size {_expected_spm_vocab_size}, but the given SentencePiece model has a vocabulary size "
f"of {spm_vocab_size}. Please provide a correctly configured SentencePiece model."
)
self.blank_idx = spm_vocab_size

# ``conformer_rnnt_base`` hardcodes a specific Conformer RNN-T configuration.
# For greater customizability, please refer to ``conformer_rnnt_model``.
self.model = conformer_rnnt_base()
self.loss = torchaudio.transforms.RNNTLoss(reduction="sum")
self.optimizer = torch.optim.Adam(self.model.parameters(), lr=8e-4, betas=(0.9, 0.98), eps=1e-9)
Expand All @@ -217,8 +230,6 @@ def __init__(

self.librispeech_path = librispeech_path

self.sp_model = spm.SentencePieceProcessor(model_file=sp_model_path)
self.blank_idx = self.sp_model.get_piece_size()
self.train_dataset_lengths = None
self.val_dataset_lengths = None

Expand Down

0 comments on commit da751eb

Please sign in to comment.