pytorch
diff --git a/beginner_source/audio_data_augmentation_tutorial.py b/beginner_source/audio_data_augmentation_tutorial.py
Lines changed: 4 additions & 436 deletions
diff --git a/beginner_source/audio_datasets_tutorial.py b/beginner_source/audio_datasets_tutorial.py
Lines changed: 5 additions & 81 deletions
diff --git a/beginner_source/audio_feature_augmentation_tutorial.py b/beginner_source/audio_feature_augmentation_tutorial.py
Lines changed: 5 additions & 162 deletions
@@ -3,85 +3,9 @@
 Audio Datasets
 ==============
 
-``torchaudio`` provides easy access to common, publicly accessible
-datasets. Please refer to the official documentation for the list of
-available datasets.
-"""
-
-# When running this tutorial in Google Colab, install the required packages
-# with the following.
-# !pip install torchaudio
-
-import torch
-import torchaudio
-
-print(torch.__version__)
-print(torchaudio.__version__)
-
-######################################################################
-# Preparing data and utility functions (skip this section)
-# --------------------------------------------------------
-#
-
-# @title Prepare data and utility functions. {display-mode: "form"}
-# @markdown
-# @markdown You do not need to look into this cell.
-# @markdown Just execute once and you are good to go.
-
-# -------------------------------------------------------------------------------
-# Preparation of data and helper functions.
-# -------------------------------------------------------------------------------
-import multiprocessing
-import os
-
-import matplotlib.pyplot as plt
-from IPython.display import Audio, display
-
-
-_SAMPLE_DIR = "_assets"
-YESNO_DATASET_PATH = os.path.join(_SAMPLE_DIR, "yes_no")
-os.makedirs(YESNO_DATASET_PATH, exist_ok=True)
-
+This tutorial has been moved to https://pytorch.org/audio/stable/tutorials/audio_datasets_tutorial.html
 
-def plot_specgram(waveform, sample_rate, title="Spectrogram", xlim=None):
-    waveform = waveform.numpy()
-
-    num_channels, num_frames = waveform.shape
-
-    figure, axes = plt.subplots(num_channels, 1)
-    if num_channels == 1:
-        axes = [axes]
-    for c in range(num_channels):
-        axes[c].specgram(waveform[c], Fs=sample_rate)
-        if num_channels > 1:
-            axes[c].set_ylabel(f"Channel {c+1}")
-        if xlim:
-            axes[c].set_xlim(xlim)
-    figure.suptitle(title)
-    plt.show(block=False)
-
-
-def play_audio(waveform, sample_rate):
-    waveform = waveform.numpy()
-
-    num_channels, num_frames = waveform.shape
-    if num_channels == 1:
-        display(Audio(waveform[0], rate=sample_rate))
-    elif num_channels == 2:
-        display(Audio((waveform[0], waveform[1]), rate=sample_rate))
-    else:
-        raise ValueError("Waveform with more than 2 channels are not supported.")
-
-
-######################################################################
-# Here, we show how to use the
-# :py:func:`torchaudio.datasets.YESNO` dataset.
-#
-
-
-dataset = torchaudio.datasets.YESNO(YESNO_DATASET_PATH, download=True)
-
-for i in [1, 3, 5]:
-    waveform, sample_rate, label = dataset[i]
-    plot_specgram(waveform, sample_rate, title=f"Sample {i}: {label}")
-    play_audio(waveform, sample_rate)
+It will redirect in 3 seconds.
+
+.. raw:: html
+
+   <meta http-equiv="Refresh" content="3; url='https://pytorch.org/audio/stable/tutorials/audio_datasets_tutorial.html'" />
+"""
@@ -2,167 +2,10 @@
 """
 Audio Feature Augmentation
 ==========================
-"""
-
-# When running this tutorial in Google Colab, install the required packages
-# with the following.
-# !pip install torchaudio librosa
-
-import torch
-import torchaudio
-import torchaudio.transforms as T
-
-print(torch.__version__)
-print(torchaudio.__version__)
-
-######################################################################
-# Preparing data and utility functions (skip this section)
-# --------------------------------------------------------
-#
-
-# @title Prepare data and utility functions. {display-mode: "form"}
-# @markdown
-# @markdown You do not need to look into this cell.
-# @markdown Just execute once and you are good to go.
-# @markdown
-# @markdown In this tutorial, we will use a speech data from [VOiCES dataset](https://iqtlabs.github.io/voices/),
-# @markdown which is licensed under Creative Commos BY 4.0.
-
-# -------------------------------------------------------------------------------
-# Preparation of data and helper functions.
-# -------------------------------------------------------------------------------
-
-import os
-
-import librosa
-import matplotlib.pyplot as plt
-import requests
-
-
-_SAMPLE_DIR = "_assets"
-
-SAMPLE_WAV_SPEECH_URL = "https://pytorch-tutorial-assets.s3.amazonaws.com/VOiCES_devkit/source-16k/train/sp0307/Lab41-SRI-VOiCES-src-sp0307-ch127535-sg0042.wav"  # noqa: E501
-SAMPLE_WAV_SPEECH_PATH = os.path.join(_SAMPLE_DIR, "speech.wav")
-
-os.makedirs(_SAMPLE_DIR, exist_ok=True)
-
-
-def _fetch_data():
-    uri = [
-        (SAMPLE_WAV_SPEECH_URL, SAMPLE_WAV_SPEECH_PATH),
-    ]
-    for url, path in uri:
-        with open(path, "wb") as file_:
-            file_.write(requests.get(url).content)
-
-
-_fetch_data()
-
-
-def _get_sample(path, resample=None):
-    effects = [["remix", "1"]]
-    if resample:
-        effects.extend(
-            [
-                ["lowpass", f"{resample // 2}"],
-                ["rate", f"{resample}"],
-            ]
-        )
-    return torchaudio.sox_effects.apply_effects_file(path, effects=effects)
-
-
-def get_speech_sample(*, resample=None):
-    return _get_sample(SAMPLE_WAV_SPEECH_PATH, resample=resample)
-
 
-def get_spectrogram(
-    n_fft=400,
-    win_len=None,
-    hop_len=None,
-    power=2.0,
-):
-    waveform, _ = get_speech_sample()
-    spectrogram = T.Spectrogram(
-        n_fft=n_fft,
-        win_length=win_len,
-        hop_length=hop_len,
-        center=True,
-        pad_mode="reflect",
-        power=power,
-    )
-    return spectrogram(waveform)
+This tutorial has been moved to https://pytorch.org/audio/stable/tutorials/audio_feature_augmentation_tutorial.html
 
-
-def plot_spectrogram(spec, title=None, ylabel="freq_bin", aspect="auto", xmax=None):
-    fig, axs = plt.subplots(1, 1)
-    axs.set_title(title or "Spectrogram (db)")
-    axs.set_ylabel(ylabel)
-    axs.set_xlabel("frame")
-    im = axs.imshow(librosa.power_to_db(spec), origin="lower", aspect=aspect)
-    if xmax:
-        axs.set_xlim((0, xmax))
-    fig.colorbar(im, ax=axs)
-    plt.show(block=False)
-
-
-######################################################################
-# SpecAugment
-# -----------
-#
-# `SpecAugment <https://ai.googleblog.com/2019/04/specaugment-new-data-augmentation.html>`__
-# is a popular spectrogram augmentation technique.
-#
-# ``torchaudio`` implements :py:func:`torchaudio.transforms.TimeStretch`,
-# :py:func:`torchaudio.transforms.TimeMasking` and
-# :py:func:`torchaudio.transforms.FrequencyMasking`.
-#
-
-######################################################################
-# TimeStretch
-# -----------
-#
-
-
-spec = get_spectrogram(power=None)
-stretch = T.TimeStretch()
-
-rate = 1.2
-spec_ = stretch(spec, rate)
-plot_spectrogram(torch.abs(spec_[0]), title=f"Stretched x{rate}", aspect="equal", xmax=304)
-
-plot_spectrogram(torch.abs(spec[0]), title="Original", aspect="equal", xmax=304)
-
-rate = 0.9
-spec_ = stretch(spec, rate)
-plot_spectrogram(torch.abs(spec_[0]), title=f"Stretched x{rate}", aspect="equal", xmax=304)
-
-######################################################################
-# TimeMasking
-# -----------
-#
-
-torch.random.manual_seed(4)
-
-spec = get_spectrogram()
-plot_spectrogram(spec[0], title="Original")
-
-masking = T.TimeMasking(time_mask_param=80)
-spec = masking(spec)
-
-plot_spectrogram(spec[0], title="Masked along time axis")
-
-######################################################################
-# FrequencyMasking
-# ----------------
-#
-
-
-torch.random.manual_seed(4)
-
-spec = get_spectrogram()
-plot_spectrogram(spec[0], title="Original")
-
-masking = T.FrequencyMasking(freq_mask_param=80)
-spec = masking(spec)
-
-plot_spectrogram(spec[0], title="Masked along frequency axis")
+It will redirect in 3 seconds.
+
+.. raw:: html
+
+   <meta http-equiv="Refresh" content="3; url='https://pytorch.org/audio/stable/tutorials/audio_feature_augmentation_tutorial.html'" />
+"""