<img src="images/logo.png" width="300">

In [1]:
#import modules

import numpy as np
import pandas as pd
import ipywidgets as widg
import IPython.display as idisp
import plotly.graph_objects as go


In [2]:
#color functions

predify_color = '0,71,187' #Predify dark blue, written as the three comma-separated rgb() components

#render a line of Markdown whose text is tinted with predify_color
def html( prefix, text ):
    """Display `text` as Markdown inside a span colored with predify_color.

    prefix -- Markdown placed in front of the colored span (the calls in this
              notebook pass heading markers such as '#' or '###')
    text   -- content wrapped in the colored <span>

    Returns None; the rendered Markdown is sent to the cell output.
    """
    colored_line = f'{prefix} <span style="color: rgb({predify_color})">{text}</span>'
    idisp.display( idisp.Markdown( colored_line ) )


In [3]:
#notebook title, rendered as a level-1 Markdown heading
html( prefix='#', text='Análisis de spots (Auditsa) y ratings (Inra) en la radio mexicana' )

# <span style="color: rgb(0,71,187)">Análisis de spots (Auditsa) y ratings (Inra) en la radio mexicana</span>

In [4]:
#initial settings

loadflag = 'y' #'y': load saved files, 'n': calculate from scratch

#relative folders used by the notebook
dataloc = 'data/' #raw datafiles
imgloc = 'images/' #images

#plot settings, kept together in a single dictionary
plot_props = dict(
    marker='o',
    ms=12,
    ls='-',
    lw=3,
    fontsize=20,
    xylabel=20,
    ticklabel=15,
    legend_prop=dict( size=15 ),
    legend_hlen=2,
    legend_np=2,
)


In [5]:
#data loading

savename = dataloc + 'data.h5' #HDF5 file that stores both raw tables

#raw data: one DataFrame per source, read from the HDF5 key of the same name
data = { fuente : pd.read_hdf( savename, key=fuente ) for fuente in ( 'auditsa', 'inra' ) }


In [6]:
#section heading
html( prefix='###', text='Columnas en datos' )

### <span style="color: rgb(0,71,187)">Columnas en datos</span>

In [7]:
#get columns in dataset

def columns_dataset( base ):
    """Print, one per line, the column labels of the DataFrame stored in data[ base ]."""
    #iterating a DataFrame walks its column labels
    for nombre in data[ base ]:
        print( nombre )

#dropdown over the keys of data; each selection re-runs columns_dataset
idisp.display(
    widg.interactive(
        columns_dataset,
        base=data.keys(),
    )
)


interactive(children=(Dropdown(description='base', options=('auditsa', 'inra'), value='auditsa'), Output()), _…

In [8]:
#section heading
html( prefix='###', text='Elementos más comunes' )

### <span style="color: rgb(0,71,187)">Elementos más comunes</span>

In [9]:
#get top elements in column

def top_elements_column( df, columna, top ):
    """Print the `top` most frequent values of df[ columna ] together with their counts.

    df      -- DataFrame to inspect
    columna -- label of the column whose values are counted
    top     -- number of rows of the frequency table to show

    Returns None; the frequency table is printed.
    """
    #head() always selects by position. Slicing the counts with [:top] depends on how []
    #treats integer slices, which was label-based for float indexes in older pandas
    #versions, so numeric columns could give a different (or failing) selection.
    print( df[ columna ].value_counts().head( top ) )

html( prefix='###', text='Auditsa' )

#choose a column of the Auditsa data and a value of top between 1 and 30;
#the DataFrame itself is passed through as a fixed argument
idisp.display(
    widg.interactive(
        top_elements_column,
        df=widg.fixed( data['auditsa'] ),
        columna=data['auditsa'].columns,
        top=( 1, 30 ),
    )
)


### <span style="color: rgb(0,71,187)">Auditsa</span>

interactive(children=(Dropdown(description='columna', options=('categoria', 'compania', 'competencia', 'estaci…

In [10]:
html( prefix='###', text='Inra' )

#choose a column of the Inra data and a value of top between 1 and 30;
#the DataFrame itself is passed through as a fixed argument
idisp.display(
    widg.interactive(
        top_elements_column,
        df=widg.fixed( data['inra'] ),
        columna=data['inra'].columns,
        top=( 1, 30 ),
    )
)


### <span style="color: rgb(0,71,187)">Inra</span>

interactive(children=(Dropdown(description='columna', options=('plaza', 'mes', 'estudio', 'dias', 'target', 'u…

In [11]:
#section heading
html( prefix='###', text='Estaciones por plaza' )

### <span style="color: rgb(0,71,187)">Estaciones por plaza</span>

In [12]:
#get stations per place

def stations_place( df, plaza ):
    """Print, sorted and without repeats, the stations that df lists for one plaza.

    df    -- DataFrame with 'plaza' and 'estacion' columns
    plaza -- value of the 'plaza' column to select

    Returns None; one station is printed per line. Nothing is printed when no
    row of df matches plaza.
    """
    #a boolean mask keeps the rows of this plaza without grouping the whole frame
    #(groupby( 'plaza' ).get_group( plaza ) also raises KeyError for a value with no group)
    estaciones = df.loc[ df['plaza'] == plaza, 'estacion' ]

    #drop repeats first so that only the distinct names have to be sorted
    for estacion in estaciones.drop_duplicates().sort_values():
        print( estacion )

html( prefix='###', text='Auditsa' )

#dropdown over the distinct values of the Auditsa 'plaza' column;
#the DataFrame itself is passed through as a fixed argument
idisp.display(
    widg.interactive(
        stations_place,
        df=widg.fixed( data['auditsa'] ),
        plaza=data['auditsa']['plaza'].unique(),
    )
)

### <span style="color: rgb(0,71,187)">Auditsa</span>

interactive(children=(Dropdown(description='plaza', options=('Monterrey', 'Puebla', 'Ciudad de México', 'Cuern…

In [13]:
html( prefix='###', text='Inra' )

#dropdown over the distinct values of the Inra 'plaza' column;
#the DataFrame itself is passed through as a fixed argument
idisp.display(
    widg.interactive(
        stations_place,
        df=widg.fixed( data['inra'] ),
        plaza=data['inra']['plaza'].unique(),
    )
)

### <span style="color: rgb(0,71,187)">Inra</span>

interactive(children=(Dropdown(description='plaza', options=('Ciudad de México', 'Monterrey', 'Guadalajara', '…

In [14]:
#plot total number of spots in stations

months = [ 'enero', 'febrero', 'marzo', 'abril', 'mayo' ] #months in right order

#total number of spots per month for one station
def _monthly_spots( estacion ):
    """Return the Auditsa 'hits' of `estacion` summed per 'mes', reindexed to `months`.

    Months of `months` with no rows for the station come out as NaN after the reindex.
    """
    de_estacion = data['auditsa']['estacion'] == estacion #condition to filter data
    #.sum() instead of .agg( np.sum ): recent pandas versions warn when a NumPy
    #callable is handed to agg, and the built-in reduction gives the same totals
    return data['auditsa'][ de_estacion ].groupby( 'mes' )['hits'].sum().reindex( months )

#plot total number of spots in stations
def plot_spots_station( estacion_1, estacion_2 ):
    """Plot the monthly number of spots of two stations, one line per station.

    estacion_1, estacion_2 -- values of the Auditsa 'estacion' column to compare

    Returns None; the plotly figure is shown.
    """
    #initialise plot
    fig = go.Figure()
    fig.update_layout( title='Número de spots en estaciones',
                       xaxis_title='mes',
                       yaxis_title='Número de spots' )

    #one trace per station, added in argument order
    for estacion in ( estacion_1, estacion_2 ):
        spots = _monthly_spots( estacion )
        fig.add_trace( go.Scatter( x=spots.index, y=spots, name=estacion ) )

    #finalise plot
    fig.show()

#two dropdowns over the sorted, distinct Auditsa station names;
#every change of selection calls plot_spots_station again
idisp.display(
    widg.interactive(
        plot_spots_station,
        estacion_1=data['auditsa']['estacion'].sort_values().unique(),
        estacion_2=data['auditsa']['estacion'].sort_values().unique(),
    )
)

interactive(children=(Dropdown(description='estacion_1', options=('CDMX XEABC-AM - (760 AM) ABC Radio', 'CDMX …