# Getting data for São Paulo

For this case, data was collected manually

Source: https://qualar.cetesb.sp.gov.br/qualar/exportaDadosAvanc.do?method=filtrarParametros

In [2]:
# libraries
import h3
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt

In [3]:
# Measurement table (semicolon-separated); later cells use its Station, Date and Hour columns.
df = pd.read_csv('dadosSP.csv', sep=';')

# Station coordinate table (semicolon-separated).
dfCoordenates = pd.read_csv('coordenadas.csv', sep=';')

# Label each coordinate row with a station name, taken in order of first
# appearance in df.
# NOTE(review): the assignment is positional, so it presumably relies on
# coordenadas.csv listing the stations in that same order -- confirm.
dfCoordenates['Station'] = df['Station'].unique()

In [4]:
# Key the coordinate table by station name.
dfCoordenates = dfCoordenates.set_index('Station')

# H3 cell id (resolution 9) for every station, computed from its lat/lon pair.
# NOTE: geo_to_h3 is the h3-py v3 name; h3-py v4 renamed it to latlng_to_cell.
H3_RESOLUTION = 9
dfCoordenates['h3id'] = [
    h3.geo_to_h3(lat, lon, H3_RESOLUTION)
    for lat, lon in zip(dfCoordenates['Latitude'], dfCoordenates['Longitude'])
]

# Lookup table: station name -> H3 cell id.
h3dict = dfCoordenates['h3id'].to_dict()

In [5]:
# Merge the separate Date and Hour columns into a single timestamp column.
# NOTE(review): pd.to_datetime is called without an explicit format/dayfirst;
# confirm the date strings in dadosSP.csv are not day-first ambiguous.
df['Date'] = pd.to_datetime(df['Date']) + pd.to_timedelta(df['Hour'])
df = df.drop(columns=['Hour'])

# Coerce every column from the third one onwards to numeric; values that
# cannot be parsed become NaN (errors='coerce').
# Applied column-wise (the DataFrame.apply default): one vectorised
# pd.to_numeric call per column instead of one Python-level call per row.
# NOTE(review): assumes the first two remaining columns are the non-numeric
# ones (station and date) -- confirm against the CSV layout.
value_columns = df.columns[2:]
df[value_columns] = df[value_columns].apply(pd.to_numeric, errors='coerce')

### April 2019

In [6]:
# April 2019: keep rows whose timestamp falls in the half-open interval
# [2019-04-01 00:00, 2019-05-01 00:00). The exclusive upper bound leaves out
# the 2019-05-01 00:00 readings directly, so no include-then-drop step is
# needed, and no frequency alias (the 'H' spelling is deprecated in recent
# pandas) is involved.
month_start = pd.Timestamp('2019-04-01 00:00:00')
month_end = pd.Timestamp('2019-05-01 00:00:00')
in_month = (df['Date'] >= month_start) & (df['Date'] < month_end)

# reset_index returns a new frame with a fresh 0..n-1 index, independent of df.
dfTemp = df.loc[in_month].reset_index(drop=True)

In [7]:
# Attach the H3 cell of each row's station (raises KeyError for a station
# that is missing from h3dict).
dfTemp['h3id'] = [h3dict[station] for station in dfTemp['Station']]
dfTemp['time'] = pd.to_datetime(dfTemp['Date'])

# Convert concentrations from ug/m3 to ppb by dividing by the per-gas factor
# (ug/m3 per ppb).
# The conversion assumes an ambient pressure of 1 atmosphere and a temperature of 25 degrees Celsius.
# https://www2.dmu.dk/atmosphericenvironment/expost/database/docs/ppm_conversion.pdf
# NOTE(review): 1.88 matches NO2 at 25 degrees C; for NO (about 30 g/mol) the
# 25 degrees C factor would be roughly 1.23, while 1.25 corresponds to about
# 20 degrees C -- confirm against the cited table.
UGM3_PER_PPB = {'NO2': 1.88, 'NO': 1.25}
for gas, factor in UGM3_PER_PPB.items():
    dfTemp[gas] = dfTemp[gas] / factor

In [8]:
# Export the cell id, timestamp and the two converted concentrations to CSV,
# without writing the row index.
output_columns = ['h3id', 'time', 'NO2', 'NO']
y_data = dfTemp[output_columns]
y_data.to_csv('y_data.csv', index=False)