In [None]:
# Note: restart runtime after this import before running the augmentations
!pip install -U augly[audio]
!sudo apt-get install python3-magic

In [None]:
import os
import augly.audio as audaugs
import augly.utils as utils
from IPython.display import display, Audio

# Build the path to the sample WAV clip under utils.TEST_URI, then render an
# inline player for the unmodified audio.
input_audio = os.path.join(
    utils.TEST_URI,
    "audio",
    "inputs",
    "vad-go-stereo-44100.wav",
)
display(Audio(input_audio))

In [None]:
# With the input clip located, augmentations can be applied to it directly.
# Here the pitch is shifted with n_steps=4.0; the call hands back the
# augmented audio and the sample rate that the player needs.
aug_audio, sr = audaugs.pitch_shift(
    input_audio,
    n_steps=4.0,
)
display(Audio(aug_audio, rate=sr))

In [None]:
"""
A metadata list can optionally be passed to an augmentation. Metadata about
the augmentation is then appended to that list: the kwargs, the durations &
number of channels of the input & output audio clips, the segments that match
between the input and output clips (useful when the edit is temporal), and an
intensity value (defined from the kwargs of each augmentation).
"""
meta = []
aug_audio, sr = audaugs.time_stretch(input_audio, rate=0.5, metadata=meta)
display(Audio(aug_audio, rate=sr))
meta

In [None]:
# Every augmentation is offered in two forms: a function and a class.
# The class-based form is shown here; it is called on audio that has already
# been loaded, together with its sample rate.
from augly.audio.utils import validate_and_load_audio

input_audio_arr, sr = validate_and_load_audio(input_audio)

aug = audaugs.PeakingEqualizer()
meta = []
aug_audio, sr = aug(
    input_audio_arr,
    sample_rate=sr,
    metadata=meta,
)
display(Audio(aug_audio, rate=sr))
meta

In [None]:
# Several transformations can also be combined into a single callable with
# Compose, which is then invoked like any one class-based transform.
# This cell relies on `input_audio_arr` and `sr` set by an earlier cell.
aug = audaugs.Compose(
    [audaugs.AddBackgroundNoise(), audaugs.ToMono(), audaugs.Clicks()]
)
meta = []
aug_audio, sr = aug(
    input_audio_arr,
    sample_rate=sr,
    metadata=meta,
)
display(Audio(aug_audio, rate=sr))
meta