Skip to content

Commit

Permalink
Fix audio data augmentation tutorial (#1987)
Browse files Browse the repository at this point in the history
Addresses: #1930
Ref: pytorch/audio#2595
  • Loading branch information
mthrok authored Aug 1, 2022
1 parent 7976ab1 commit 4132e11
Showing 1 changed file with 4 additions and 4 deletions.
8 changes: 4 additions & 4 deletions beginner_source/audio_data_augmentation_tutorial.py
Original file line number Diff line number Diff line change
Expand Up @@ -239,14 +239,14 @@ def plot_specgram(waveform, sample_rate, title="Spectrogram", xlim=None):
noise, _ = torchaudio.load(SAMPLE_NOISE)
noise = noise[:, : speech.shape[1]]

-speech_power = speech.norm(p=2)
-noise_power = noise.norm(p=2)
+speech_rms = speech.norm(p=2)
+noise_rms = noise.norm(p=2)

snr_dbs = [20, 10, 3]
noisy_speeches = []
for snr_db in snr_dbs:
     snr = 10 ** (snr_db / 20)
-    scale = snr * noise_power / speech_power
+    scale = snr * noise_rms / speech_rms
     noisy_speeches.append((scale * speech + noise) / 2)

######################################################################
Expand Down Expand Up @@ -376,7 +376,7 @@ def plot_specgram(waveform, sample_rate, title="Spectrogram", xlim=None):
noise = noise[:, : rir_applied.shape[1]]

snr_db = 8
-scale = math.exp(snr_db / 10) * noise.norm(p=2) / rir_applied.norm(p=2)
+scale = (10 ** (snr_db / 20)) * noise.norm(p=2) / rir_applied.norm(p=2)
bg_added = (scale * rir_applied + noise) / 2

plot_specgram(bg_added, sample_rate, title="BG noise added")
Expand Down

0 comments on commit 4132e11

Please sign in to comment.