## Basic imports

In [1]:
import numpy as np
import pandas

import wqio
import pynsqd
import pycvc

## Load and export from the `pycvc` external module

In [2]:
def _write_csv(frame, filename):
    """Write ``frame`` to ``filename`` as CSV, omitting the index column."""
    frame.to_csv(filename, index=False)


# Build the NSQD object through pycvc's external-data helper. The two
# positional arguments are forwarded as-is.
# NOTE(review): presumably plotting color/marker options -- confirm against pycvc.
nsqdata = pycvc.external.nsqd('red', 'd')

# Export the three tables exposed by the object, one CSV file each.
_write_csv(nsqdata.data, "nsqdata_in_pycvc.csv")
_write_csv(nsqdata.medians, 'ED1_influent_medians.csv')
_write_csv(nsqdata.datacollection.tidy, "nsqtidy.csv")



### Read in the hand-filtered data and flag censored results for ROS

In [3]:
# Columns pulled from the hand-filtered subset file; everything else is skipped.
main_cols = [
    'epa_rain_zone',
    'season',
    'primary_landuse',
    'parameter',
    'fraction',
    'units',
    'res',
    'qual',
]

# Read the subset and append a boolean `cen` column that is True wherever the
# `qual` qualifier is '<' (the censoring flag consumed by the ROS step).
df = (
    pandas.read_csv("nsqdata_example_subset.csv", usecols=main_cols)
    .assign(cen=lambda subset: subset['qual'].isin(['<']))
)
df.head()

Unnamed: 0,epa_rain_zone,primary_landuse,season,parameter,fraction,units,res,qual,cen
0,1,Residential,spring,Cadmium,Total,ug/L,10,<,True
1,1,Residential,spring,Cadmium,Total,ug/L,10,<,True
2,1,Residential,spring,Cadmium,Total,ug/L,10,<,True
3,1,Residential,spring,Cadmium,Total,ug/L,10,<,True
4,1,Residential,spring,Cadmium,Total,ug/L,1,<,True


## Show the median computed from the subset above

In [4]:
# Build wqio's robust ROS estimator from the subset frame loaded above.
# NOTE(review): presumably it picks up the `res` and `cen` columns by default --
# confirm against the installed wqio version.
ros = wqio.robustros.RobustROSEstimator(data=df)
# Display the median of the estimator's `estimated_values`.
np.median(ros.estimated_values)

0.35189348345894644

## Show the same result used in `pycvc`

In [5]:
# Select the spring Cadmium row from pycvc's seasonal medians table so it can
# be compared with the median computed from the subset.
nsqdata.season_medians.query("parameter == 'Cadmium (Cd)' and season == 'spring'")

Unnamed: 0,parameter,season,lower,NSQD Medians,upper
1,Cadmium (Cd),spring,0.172,0.352,0.525
