In [82]:
import librosa
import librosa.display
import numpy as np
import scipy
import scipy.io.wavfile
import tqdm

In [72]:
import random

In [6]:
# Display the `musica` array (NumPy abbreviates the repr of long arrays).
# NOTE(review): `musica` is only assigned in a later cell of this notebook
# (the `librosa.load(...)` cell), so this cell relies on prior kernel state
# and would fail on a fresh top-to-bottom run -- TODO confirm and move/remove.
musica

array([0., 0., 0., ..., 0., 0., 0.], dtype=float32)

In [15]:
def smooth(x, window_len=11, window='hanning'):
    """Smooth a 1-D signal by convolving it with a normalized window.

    The signal is first extended at both ends with reflected copies of
    itself (``window_len - 1`` samples per side) so that transients at the
    beginning and end of the output are reduced.  The extended signal is
    then convolved (``mode='valid'``) with the window scaled to unit sum.

    Parameters
    ----------
    x : array_like
        1-D input signal containing at least ``window_len`` samples.
    window_len : int
        Size of the smoothing window; should be an odd integer.  Tapered
        windows need ``window_len >= 3``: ``np.hanning(2)`` and
        ``np.bartlett(2)`` are all zeros and cannot be normalized.
    window : str
        One of 'flat', 'hanning', 'hamming', 'bartlett', 'blackman'.
        'flat' produces a moving-average smoothing.

    Returns
    -------
    numpy.ndarray
        The smoothed signal.  Its length is ``len(x) + window_len - 1``,
        NOT ``len(x)``.  For an odd ``window_len >= 3`` the slice
        ``y[window_len // 2 : -(window_len // 2)]`` has the input length.

    Raises
    ------
    ValueError
        If ``window`` is not one of the supported names, if ``x`` is not
        one-dimensional, or if ``x`` has fewer than ``window_len`` samples.

    Example
    -------
    >>> t = np.arange(-2, 2, 0.1)
    >>> x = np.sin(t) + np.random.randn(len(t)) * 0.1
    >>> y = smooth(x)

    See also
    --------
    numpy.hanning, numpy.hamming, numpy.bartlett, numpy.blackman,
    numpy.convolve, scipy.signal.lfilter

    TODO: the window parameter could be the window itself (an array)
    instead of a string.
    """
    valid_windows = ('flat', 'hanning', 'hamming', 'bartlett', 'blackman')
    if window not in valid_windows:
        raise ValueError(
            "Window is one of 'flat', 'hanning', 'hamming', 'bartlett', 'blackman'"
        )

    x = np.asarray(x)
    if x.ndim != 1:
        raise ValueError("smooth only accepts 1 dimension arrays.")
    if x.size < window_len:
        # With too few samples the reflected padding comes out shorter than
        # requested and the output length is silently wrong.
        raise ValueError("Input vector needs to be bigger than window size.")

    # Reflect (window_len - 1) samples around each end of the signal.
    s = np.r_[x[window_len - 1:0:-1], x, x[-2:-window_len - 1:-1]]

    if window == 'flat':  # moving average
        w = np.ones(window_len, 'd')
    else:
        # Look the window function up by name on numpy; the whitelist above
        # replaces the former eval() of a caller-supplied string.
        w = getattr(np, window)(window_len)

    return np.convolve(w / w.sum(), s, mode='valid')

In [166]:
def wave(f, duration, fs=None):
    """Generate a sine tone as a float32 array.

    Parameters
    ----------
    f : float
        Tone frequency, in cycles per second when ``fs`` is in samples
        per second.
    duration : float
        Tone length in seconds; ``fs * duration`` samples are produced.
    fs : int or float, optional
        Sample rate.  When omitted, the notebook-level ``sr`` is used, so
        ``sr`` must already be defined (it is set by the cell that loads
        the audio file).

    Returns
    -------
    numpy.ndarray
        float32 samples of ``sin(2*pi*f*n/fs)`` for ``n = 0, 1, 2, ...``.
    """
    if fs is None:
        # Backward-compatible default: fall back to the global sample rate.
        fs = sr
    n = np.arange(fs * duration)
    return np.sin(2 * np.pi * n * f / fs).astype(np.float32)

def obstacle(length):
    """Return a noisy half-sine bump of ``length`` float32 samples.

    The bump is ``sin(pi * k / length)`` for ``k = 0 .. length - 1``, with
    uniform noise drawn from ``[0, 0.1)`` (via ``np.random.rand``) added
    to every sample.
    """
    phase = np.pi * np.arange(length) / length
    bump = np.sin(phase).astype(np.float32)
    jitter = 0.1 * np.random.rand(length)
    # Accumulate in place so the result stays float32, like ``bump += jitter``.
    np.add(bump, jitter, out=bump)
    return bump

In [262]:
# Load the recording at a 44.1 kHz sample rate, then smooth it with a
# 90-sample Hanning window.  smooth() returns window_len - 1 = 89 more
# samples than it receives, so `musica` ends up longer than the loaded audio.
musica, sr = librosa.load(path='b9.wav', sr=44100)
musica = smooth(x=musica, window_len=90, window='hanning')

In [263]:
# Start the mask as uniform noise in [0, 1), 100 samples longer than musica.
mask = np.random.rand(len(musica) + 100)

In [264]:
# Frequencies whose periods bound the obstacle lengths.
ob_st_freq = 200
ob_end_freq = 10000

# One period of each bounding frequency, in samples: the shortest and the
# longest obstacle that may be drawn.
minlen = int(sr / ob_end_freq)
maxlen = int(sr / ob_st_freq)

# Add 20000 obstacles of random length at random positions.  Start positions
# are drawn between 2*maxlen and len(musica) - 2*maxlen (both inclusive).
for i in tqdm.trange(20000):
    pos = random.randint(2 * maxlen, musica.shape[0] - 2 * maxlen)
    le = random.randint(minlen, maxlen)
    obs = obstacle(le)
    mask[pos:pos + le] += obs

# Smooth the accumulated mask with an 80-sample Hanning window
# (this lengthens `mask` by 79 samples).
mask = smooth(mask, window_len=80)

100%|██████| 20000/20000 [00:00<00:00, 60784.55it/s]


In [265]:
# Scale the mask down to 2% and add its leading part onto the music in place.
# Both statements mutate their operands, so re-running this cell applies the
# scaling and the mix a second time.
mask *= 0.02
musica += mask[:len(musica)]

In [266]:
# Write the mixed signal and the mask to WAV files.
# `librosa.output.write_wav` was removed in librosa 0.8; scipy.io.wavfile.write
# is what it called internally for this mono, non-normalized case.
# Note the argument order: (filename, rate, data).
scipy.io.wavfile.write('gen.wav', sr, musica)
scipy.io.wavfile.write('mask.wav', sr, mask)

array([0.00000000e+00, 1.07887821e-01, 3.97492719e-03, 7.27619877e-01,
       7.35685341e-01, 7.94387107e-01, 3.30880846e-01, 4.77273906e-02,
       2.46996278e-01, 8.22792903e-17])