In [None]:
import pandas as pd
import numpy as np

import librosa
import librosa.display
import IPython.display as ipd

# Root of the BirdCLEF 2022 dataset. Every path below is derived from it, so
# the notebook can be pointed at another copy of the data by editing one line.
BIRDCLEF_DIR = "../input/birdclef-2022/"

# Audio folders (trailing slash kept so file names can be appended directly).
TRAIN_AUDIO_FOLDER = BIRDCLEF_DIR + "train_audio/"
TEST_AUDIO_FOLDER = BIRDCLEF_DIR + "test_soundscapes/"

# Tabular files.
TRAIN_PATH = BIRDCLEF_DIR + "train_metadata.csv"
TEST_PATH = BIRDCLEF_DIR + "test.csv"
SAMPLE_SUBMISSION_PATH = BIRDCLEF_DIR + "sample_submission.csv"

# Auxiliary files.
TAXONOMY_PATH = BIRDCLEF_DIR + "eBird_Taxonomy_v2021.csv"
SCORED_BIRDS_JSON = BIRDCLEF_DIR + "scored_birds.json"

# Single training recording used as the running example in the cells below.
AUDIO_SAMPLE_PATH = TRAIN_AUDIO_FOLDER + "afrsil1/XC175522.ogg"
# The original (misspelled) name is kept because other cells reference it.
AUDID_SAMPLE_PATH = AUDIO_SAMPLE_PATH

In [None]:
# Read the CSV files at TRAIN_PATH and TEST_PATH into DataFrames.
train = pd.read_csv(TRAIN_PATH)
test = pd.read_csv(TEST_PATH)

In [None]:
# Preview the first rows of the training DataFrame.
train.head()

In [None]:
# Print the DataFrame summary (columns, dtypes, non-null counts).
train.info()

In [None]:
# Summary statistics from describe(), transposed so each described column is a row.
train.describe().T

# Play the sample recording

In [None]:
# Build an IPython audio widget for the sample file; as the cell's last
# expression it is rendered as the cell output.
ipd.Audio(AUDID_SAMPLE_PATH)

# Load the sample recording with librosa

In [None]:
# Decode the sample recording into a NumPy array plus its sample rate.
# NOTE: librosa.load is called with its defaults, which (per the librosa docs)
# resample to 22,050 Hz and mix down to mono, so `sample_rate` below is the
# target rate, not necessarily the file's native one. Pass sr=None to keep
# the native rate.
audio_data, sample_rate = librosa.load(AUDID_SAMPLE_PATH)
print("audio data shape = ",audio_data.shape)
print("sample_rate = ",sample_rate)
# ndarray.size is the total element count; it replaces len(audio_data.data),
# which went through the raw buffer and only reported the first dimension.
print("audio data size= ",audio_data.size)

# Plot the raw waveform

In [None]:
import matplotlib.pylab as plt
import seaborn as sns
import plotly.express as px

def show_raw_audio_data(filePath):
    """Plot the raw waveform (amplitude over time) of an audio file.

    Parameters
    ----------
    filePath : str
        Path of the audio file to load; also used as the figure title.

    Returns
    -------
    None
        The figure is displayed with ``plt.show()``.

    Notes
    -----
    The file is loaded with ``librosa.load`` defaults, which (per the librosa
    docs) resample to 22,050 Hz and mix down to mono.
    """
    y, sr = librosa.load(filePath)

    # Convert sample indices to seconds so the x-axis uses the same unit as
    # the mel-spectrogram plot.
    times = np.arange(len(y)) / sr

    fig, ax = plt.subplots(figsize=(12, 5))
    # Very thin line: a waveform has tens of thousands of points per second.
    ax.plot(times, y, lw=0.1)
    ax.set(title=filePath, xlabel="Time (s)", ylabel="Amplitude")
    plt.show()

# Plot the sample recording.
show_raw_audio_data(AUDID_SAMPLE_PATH)

# Plot the mel spectrogram

In [None]:
def show_audio_melspec(filePath, n_mels=80, fmax=8000):
    """Plot the mel spectrogram (in dB) of an audio file.

    Parameters
    ----------
    filePath : str
        Path of the audio file to load; also used as the figure title.
    n_mels : int, optional
        Number of mel bands passed to ``librosa.feature.melspectrogram``.
        Defaults to 80.
    fmax : float, optional
        Upper frequency bound in Hz, used both when computing the spectrogram
        and when labelling the y-axis. Defaults to 8000.

    Returns
    -------
    None
        The figure is displayed with ``plt.show()``.
    """
    y, sr = librosa.load(filePath)

    # Power mel spectrogram, then converted to dB relative to its maximum
    # value so that the loudest bin sits at 0 dB.
    S = librosa.feature.melspectrogram(y=y, sr=sr, n_mels=n_mels, fmax=fmax)
    S_dB = librosa.power_to_db(S, ref=np.max)

    fig, ax = plt.subplots(figsize=(12, 5))
    # The same fmax is passed to specshow as to melspectrogram, so the
    # frequency-axis labels describe the bands that were actually computed.
    img = librosa.display.specshow(
        S_dB, x_axis="time", y_axis="mel", sr=sr, fmax=fmax, ax=ax
    )
    fig.colorbar(img, ax=ax, format="%+2.0f dB")
    ax.set(title=filePath)
    plt.show()
    
# Plot the mel spectrogram of the sample recording.
show_audio_melspec(AUDID_SAMPLE_PATH)