In [1]:
import ast
import pandas as pd
import numpy as np
import altair as alt 
from altair import Chart, X, Y, Color, Scale

In [2]:
# Load the New York monitoring data and discard columns that hold no values at all.
df = (
    pd.read_csv('new_york.csv')
    .dropna(axis='columns', how='all')
)
df.head()

Unnamed: 0,state,site,disposal.area,type,well.id,gradient,samp.date,contaminant,measurement.unit,concentration
0,NY,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,8/30/16,"Mercury, total",mg/l,5e-07
1,NY,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,5/16/17,"Antimony, total",mg/l,0.001
2,NY,Dunkirk Generating Station,Dunkirk Landfill,L,BR-20-DG,Downgradient,5/16/17,"Antimony, total",mg/l,0.0014
3,NY,Dunkirk Generating Station,Dunkirk Landfill,L,BR-13-DG,Downgradient,5/16/17,"Antimony, total",mg/l,0.0015
4,NY,Dunkirk Generating Station,Dunkirk Landfill,L,BR-3-DG,Downgradient,5/16/17,"Antimony, total",mg/l,0.0016


In [3]:
# Drop the 'state' column: per the original note, every row is New York, so it adds nothing.
df = df.drop('state', axis='columns')
df.head()

Unnamed: 0,site,disposal.area,type,well.id,gradient,samp.date,contaminant,measurement.unit,concentration
0,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,8/30/16,"Mercury, total",mg/l,5e-07
1,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,5/16/17,"Antimony, total",mg/l,0.001
2,Dunkirk Generating Station,Dunkirk Landfill,L,BR-20-DG,Downgradient,5/16/17,"Antimony, total",mg/l,0.0014
3,Dunkirk Generating Station,Dunkirk Landfill,L,BR-13-DG,Downgradient,5/16/17,"Antimony, total",mg/l,0.0015
4,Dunkirk Generating Station,Dunkirk Landfill,L,BR-3-DG,Downgradient,5/16/17,"Antimony, total",mg/l,0.0016


In [4]:
# Drop the sampling date; the original note treats it as irrelevant because every row is a sample.
df = df.drop('samp.date', axis='columns')
df.head()

Unnamed: 0,site,disposal.area,type,well.id,gradient,contaminant,measurement.unit,concentration
0,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,"Mercury, total",mg/l,5e-07
1,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,"Antimony, total",mg/l,0.001
2,Dunkirk Generating Station,Dunkirk Landfill,L,BR-20-DG,Downgradient,"Antimony, total",mg/l,0.0014
3,Dunkirk Generating Station,Dunkirk Landfill,L,BR-13-DG,Downgradient,"Antimony, total",mg/l,0.0015
4,Dunkirk Generating Station,Dunkirk Landfill,L,BR-3-DG,Downgradient,"Antimony, total",mg/l,0.0016


In [5]:
# Shorten the dotted column names so they are easier to type in later cells.
df = df.rename(
    {
        'disposal.area': 'disposal',
        'measurement.unit': 'unit',
        'well.id': 'well',
    },
    axis='columns',
)
df.head()

Unnamed: 0,site,disposal,type,well,gradient,contaminant,unit,concentration
0,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,"Mercury, total",mg/l,5e-07
1,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,"Antimony, total",mg/l,0.001
2,Dunkirk Generating Station,Dunkirk Landfill,L,BR-20-DG,Downgradient,"Antimony, total",mg/l,0.0014
3,Dunkirk Generating Station,Dunkirk Landfill,L,BR-13-DG,Downgradient,"Antimony, total",mg/l,0.0015
4,Dunkirk Generating Station,Dunkirk Landfill,L,BR-3-DG,Downgradient,"Antimony, total",mg/l,0.0016


In [6]:
# Strip the ', total' suffix from contaminant names (e.g. 'Mercury, total' -> 'Mercury').
# The pattern is the literal text ', total'. The previous pattern '[n,] total' was a
# character class, so it also matched 'n total' and would have removed the final 'n'
# from any value written like '...n total'.
# Note: as before, the replacement is applied to every string column of the frame.
df = df.replace(to_replace=', total', value='', regex=True)
df.head()

Unnamed: 0,site,disposal,type,well,gradient,contaminant,unit,concentration
0,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
1,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Antimony,mg/l,0.001
2,Dunkirk Generating Station,Dunkirk Landfill,L,BR-20-DG,Downgradient,Antimony,mg/l,0.0014
3,Dunkirk Generating Station,Dunkirk Landfill,L,BR-13-DG,Downgradient,Antimony,mg/l,0.0015
4,Dunkirk Generating Station,Dunkirk Landfill,L,BR-3-DG,Downgradient,Antimony,mg/l,0.0016


In [7]:
# Count the distinct contaminant names.
df.contaminant.nunique()

21

In [8]:
# List the distinct contaminant names.
# Note: bracket access (df['contaminant']) and attribute access (df.contaminant)
# select the same column.

# TODO(question): what is pH? what is TDS? do we need the numbers after Radium?

df['contaminant'].unique()

array(['Mercury', 'Antimony', 'Lead', 'Arsenic', 'Chromium', 'Thallium',
       'Barium', 'Boron', 'Radium 226+228', 'Fluoride', 'Chloride', 'pH',
       'Calcium', 'Sulfate', 'Total Dissolved Solids', 'Beryllium',
       'Cadmium', 'Selenium', 'Molybdenum', 'Cobalt', 'Lithium'],
      dtype=object)

In [9]:
# List the distinct sites.
df['site'].unique()

array(['Dunkirk Generating Station', 'Huntley Generating Station'],
      dtype=object)

In [10]:
# List the distinct disposal areas.

# TODO(question): what is a disposal area, and how does it differ from a site?

df['disposal'].unique()

array(['Dunkirk Landfill', 'Huntley Landfill', 'South Settling Pond'],
      dtype=object)

In [11]:
# List the distinct values of the 'type' column.

# TODO(question): what do these codes mean, and can they be combined?

df['type'].unique()

array(['L', 'SI'], dtype=object)

In [12]:
# List the distinct measurement units.
# TODO(question): can everything be converted to mg/l, or should non-mg/l rows be dropped?
# Original notes: pCi/l is the unit used for Radium; su is the unit used for pH.

df['unit'].unique()

array(['mg/l', 'pCi/l', 'su'], dtype=object)

In [13]:
# Count the distinct wells.
df['well'].nunique()

17

In [14]:
# List the distinct well ids.
df['well'].unique()

array(['BR-14-UG', 'BR-20-DG', 'BR-13-DG', 'BR-3-DG', 'BR-12-DG',
       'MW-13D', 'A-2', 'CCR-4', 'CCR-5', 'CCR-6', 'MW-7D', 'CCR-3',
       'MW-11D', 'MW-14D', 'CCR-2', 'MW-12D', 'CCR-1'], dtype=object)

In [15]:
# First step towards the per-well averages dict:
# select the Mercury samples taken at well BR-14-UG.

BR14_Medf = df[df['well'].eq('BR-14-UG') & df['contaminant'].eq('Mercury')]
BR14_Medf

Unnamed: 0,site,disposal,type,well,gradient,contaminant,unit,concentration
0,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
382,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
383,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
384,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
385,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
386,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
387,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,5e-07
416,Dunkirk Generating Station,Dunkirk Landfill,L,BR-14-UG,Upgradient,Mercury,mg/l,1e-06


In [16]:
# Mean Mercury concentration across the BR-14-UG samples selected above.
BR14_Medf['concentration'].mean()

5.624999999999999e-07

In [17]:
# Antimony samples taken at well BR-14-UG, followed by their mean concentration.
BR14_Andf = df[df['well'].eq('BR-14-UG') & df['contaminant'].eq('Antimony')]
BR14_Andf['concentration'].mean()

0.0454375

In [18]:
# One frame per remaining contaminant for well BR-14-UG (Mercury and Antimony are
# selected in earlier cells). The well filter is applied once, then each contaminant
# is picked out of that subset; the resulting rows are the same as filtering df on
# both conditions at once.
_BR14_samples = df.loc[df['well'] == 'BR-14-UG']

BR14_Ledf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Lead']
BR14_Ardf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Arsenic']
BR14_Chrdf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Chromium']
BR14_Tdf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Thallium']
BR14_Badf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Barium']
BR14_Bodf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Boron']
BR14_Rdf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Radium 226+228']
BR14_Fdf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Fluoride']
BR14_Chldf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Chloride']
BR14_Pdf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'pH']
BR14_Caldf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Calcium']
BR14_Sudf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Sulfate']
BR14_TDSdf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Total Dissolved Solids']
BR14_Berdf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Beryllium']
BR14_Caddf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Cadmium']
BR14_Sedf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Selenium']
BR14_Modf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Molybdenum']
BR14_Codf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Cobalt']
BR14_Lidf = _BR14_samples.loc[_BR14_samples['contaminant'] == 'Lithium']

In [19]:
# Build the BR-14-UG dictionary: one '<contaminant>_avg' entry per contaminant,
# each holding the mean concentration of the matching per-contaminant frame.

BR14_dict = {
    key: frame['concentration'].mean()
    for key, frame in [
        ('mercury_avg', BR14_Medf),
        ('antimony_avg', BR14_Andf),
        ('lead_avg', BR14_Ledf),
        ('arsenic_avg', BR14_Ardf),
        ('chromium_avg', BR14_Chrdf),
        ('thallium_avg', BR14_Tdf),
        ('barium_avg', BR14_Badf),
        ('boron_avg', BR14_Bodf),
        ('radium_avg', BR14_Rdf),
        ('fluoride_avg', BR14_Fdf),
        ('chloride_avg', BR14_Chldf),
        ('pH_avg', BR14_Pdf),
        ('calcium_avg', BR14_Caldf),
        ('sulfate_avg', BR14_Sudf),
        ('TDS_avg', BR14_TDSdf),
        ('beryllium_avg', BR14_Berdf),
        ('cadmium_avg', BR14_Caddf),
        ('selenium_avg', BR14_Sedf),
        ('molybdenum_avg', BR14_Modf),
        ('cobalt_avg', BR14_Codf),
        ('lithium_avg', BR14_Lidf),
    ]
}
BR14_dict

{'mercury_avg': 5.624999999999999e-07,
 'antimony_avg': 0.0454375,
 'lead_avg': 0.005,
 'arsenic_avg': 0.005874999999999999,
 'chromium_avg': 0.005,
 'thallium_avg': 0.007675000000000001,
 'barium_avg': 0.16625,
 'boron_avg': 0.17844444444444446,
 'radium_avg': 0.48750000000000004,
 'fluoride_avg': 0.2033333333333333,
 'chloride_avg': 3.6666666666666665,
 'pH_avg': 7.083333333333334,
 'calcium_avg': 95.22222222222223,
 'sulfate_avg': 108.66666666666667,
 'TDS_avg': 477.22222222222223,
 'beryllium_avg': 0.00475,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.005,
 'molybdenum_avg': 0.01,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.049999999999999996}

In [20]:
# Mean 'Radium 226+228' concentration over every row in df (all wells together).
df.loc[df['contaminant'].eq('Radium 226+228'), 'concentration'].mean()

0.8573600000000002

In [21]:
# Mean concentration of every contaminant sampled at well BR-20-DG.
# The mapping pairs each '<contaminant>_avg' key with the label used in df['contaminant'];
# a contaminant with no rows at this well averages to NaN (mean of an empty selection).
_BR20_samples = df.loc[df['well'] == 'BR-20-DG']
BR20_dict = {
    key: _BR20_samples.loc[_BR20_samples['contaminant'] == label, 'concentration'].mean()
    for key, label in {
        'mercury_avg': 'Mercury',
        'antimony_avg': 'Antimony',
        'lead_avg': 'Lead',
        'arsenic_avg': 'Arsenic',
        'chromium_avg': 'Chromium',
        'thallium_avg': 'Thallium',
        'barium_avg': 'Barium',
        'boron_avg': 'Boron',
        'radium_avg': 'Radium 226+228',
        'fluoride_avg': 'Fluoride',
        'chloride_avg': 'Chloride',
        'pH_avg': 'pH',
        'calcium_avg': 'Calcium',
        'sulfate_avg': 'Sulfate',
        'TDS_avg': 'Total Dissolved Solids',
        'beryllium_avg': 'Beryllium',
        'cadmium_avg': 'Cadmium',
        'selenium_avg': 'Selenium',
        'molybdenum_avg': 'Molybdenum',
        'cobalt_avg': 'Cobalt',
        'lithium_avg': 'Lithium',
    }.items()
}

# The per-contaminant scalars stay bound under their original names (despite the
# 'df' suffix they are plain means) in case another cell reads them. The unpacking
# relies on the dict keeping its insertion order.
(
    BR20_Medf, BR20_Andf, BR20_Ledf, BR20_Ardf, BR20_Chrdf, BR20_Tdf, BR20_Badf,
    BR20_Bodf, BR20_Rdf, BR20_Fdf, BR20_Chldf, BR20_Pdf, BR20_Caldf, BR20_Sudf,
    BR20_TDSdf, BR20_Berdf, BR20_Caddf, BR20_Sedf, BR20_Modf, BR20_Codf, BR20_Lidf,
) = BR20_dict.values()

# TODO: the same computation is repeated for each well; turn the well id into a
# parameter of one function that can be called per well.
BR20_dict

{'mercury_avg': 5.624999999999999e-07,
 'antimony_avg': 0.045375,
 'lead_avg': 0.005,
 'arsenic_avg': 0.0052499999999999995,
 'chromium_avg': 0.005125,
 'thallium_avg': 0.007675000000000001,
 'barium_avg': 1.6662500000000002,
 'boron_avg': 1.3988888888888888,
 'radium_avg': 1.4975,
 'fluoride_avg': 0.32222222222222224,
 'chloride_avg': 20.08888888888889,
 'pH_avg': 7.573333333333333,
 'calcium_avg': 23.11111111111111,
 'sulfate_avg': 13.555555555555555,
 'TDS_avg': 684.4444444444445,
 'beryllium_avg': 0.00475,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.005,
 'molybdenum_avg': 0.01,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.049999999999999996}

In [22]:
# Mean concentration of every contaminant sampled at well BR-13-DG.
# The mapping pairs each '<contaminant>_avg' key with the label used in df['contaminant'];
# a contaminant with no rows at this well averages to NaN (mean of an empty selection).
_BR13_samples = df.loc[df['well'] == 'BR-13-DG']
BR13_dict = {
    key: _BR13_samples.loc[_BR13_samples['contaminant'] == label, 'concentration'].mean()
    for key, label in {
        'mercury_avg': 'Mercury',
        'antimony_avg': 'Antimony',
        'lead_avg': 'Lead',
        'arsenic_avg': 'Arsenic',
        'chromium_avg': 'Chromium',
        'thallium_avg': 'Thallium',
        'barium_avg': 'Barium',
        'boron_avg': 'Boron',
        'radium_avg': 'Radium 226+228',
        'fluoride_avg': 'Fluoride',
        'chloride_avg': 'Chloride',
        'pH_avg': 'pH',
        'calcium_avg': 'Calcium',
        'sulfate_avg': 'Sulfate',
        'TDS_avg': 'Total Dissolved Solids',
        'beryllium_avg': 'Beryllium',
        'cadmium_avg': 'Cadmium',
        'selenium_avg': 'Selenium',
        'molybdenum_avg': 'Molybdenum',
        'cobalt_avg': 'Cobalt',
        'lithium_avg': 'Lithium',
    }.items()
}

# The per-contaminant scalars stay bound under their original names (despite the
# 'df' suffix they are plain means) in case another cell reads them. The unpacking
# relies on the dict keeping its insertion order.
(
    BR13_Medf, BR13_Andf, BR13_Ledf, BR13_Ardf, BR13_Chrdf, BR13_Tdf, BR13_Badf,
    BR13_Bodf, BR13_Rdf, BR13_Fdf, BR13_Chldf, BR13_Pdf, BR13_Caldf, BR13_Sudf,
    BR13_TDSdf, BR13_Berdf, BR13_Caddf, BR13_Sedf, BR13_Modf, BR13_Codf, BR13_Lidf,
) = BR13_dict.values()

BR13_dict

{'mercury_avg': 5.624999999999999e-07,
 'antimony_avg': 0.0455625,
 'lead_avg': 0.005,
 'arsenic_avg': 0.005375,
 'chromium_avg': 0.005,
 'thallium_avg': 0.007925,
 'barium_avg': 0.07375,
 'boron_avg': 0.1961111111111111,
 'radium_avg': 0.46499999999999997,
 'fluoride_avg': 0.2011111111111111,
 'chloride_avg': 7.911111111111111,
 'pH_avg': 7.135555555555557,
 'calcium_avg': 105.0,
 'sulfate_avg': 102.88888888888889,
 'TDS_avg': 554.4444444444445,
 'beryllium_avg': 0.00475,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.005,
 'molybdenum_avg': 0.01,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.049999999999999996}

In [23]:
# Mean concentration of every contaminant sampled at well BR-3-DG.
# The mapping pairs each '<contaminant>_avg' key with the label used in df['contaminant'];
# a contaminant with no rows at this well averages to NaN (mean of an empty selection).
_BR3_samples = df.loc[df['well'] == 'BR-3-DG']
BR3_dict = {
    key: _BR3_samples.loc[_BR3_samples['contaminant'] == label, 'concentration'].mean()
    for key, label in {
        'mercury_avg': 'Mercury',
        'antimony_avg': 'Antimony',
        'lead_avg': 'Lead',
        'arsenic_avg': 'Arsenic',
        'chromium_avg': 'Chromium',
        'thallium_avg': 'Thallium',
        'barium_avg': 'Barium',
        'boron_avg': 'Boron',
        'radium_avg': 'Radium 226+228',
        'fluoride_avg': 'Fluoride',
        'chloride_avg': 'Chloride',
        'pH_avg': 'pH',
        'calcium_avg': 'Calcium',
        'sulfate_avg': 'Sulfate',
        'TDS_avg': 'Total Dissolved Solids',
        'beryllium_avg': 'Beryllium',
        'cadmium_avg': 'Cadmium',
        'selenium_avg': 'Selenium',
        'molybdenum_avg': 'Molybdenum',
        'cobalt_avg': 'Cobalt',
        'lithium_avg': 'Lithium',
    }.items()
}

# The per-contaminant scalars stay bound under their original names (despite the
# 'df' suffix they are plain means) in case another cell reads them. The unpacking
# relies on the dict keeping its insertion order.
(
    BR3_Medf, BR3_Andf, BR3_Ledf, BR3_Ardf, BR3_Chrdf, BR3_Tdf, BR3_Badf,
    BR3_Bodf, BR3_Rdf, BR3_Fdf, BR3_Chldf, BR3_Pdf, BR3_Caldf, BR3_Sudf,
    BR3_TDSdf, BR3_Berdf, BR3_Caddf, BR3_Sedf, BR3_Modf, BR3_Codf, BR3_Lidf,
) = BR3_dict.values()

BR3_dict

{'mercury_avg': 5.624999999999999e-07,
 'antimony_avg': 0.0457,
 'lead_avg': 0.005125,
 'arsenic_avg': 0.005874999999999999,
 'chromium_avg': 0.005,
 'thallium_avg': 0.007925,
 'barium_avg': 0.03875,
 'boron_avg': 0.09355555555555556,
 'radium_avg': 0.69125,
 'fluoride_avg': 0.22777777777777775,
 'chloride_avg': 57.77777777777778,
 'pH_avg': 7.118888888888888,
 'calcium_avg': 126.33333333333333,
 'sulfate_avg': 155.11111111111111,
 'TDS_avg': 606.1111111111111,
 'beryllium_avg': 0.00475,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.005,
 'molybdenum_avg': 0.01,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.049999999999999996}

In [24]:
# Mean concentration of every contaminant sampled at well BR-12-DG.
# The mapping pairs each '<contaminant>_avg' key with the label used in df['contaminant'];
# a contaminant with no rows at this well averages to NaN (mean of an empty selection).
_BR12_samples = df.loc[df['well'] == 'BR-12-DG']
BR12_dict = {
    key: _BR12_samples.loc[_BR12_samples['contaminant'] == label, 'concentration'].mean()
    for key, label in {
        'mercury_avg': 'Mercury',
        'antimony_avg': 'Antimony',
        'lead_avg': 'Lead',
        'arsenic_avg': 'Arsenic',
        'chromium_avg': 'Chromium',
        'thallium_avg': 'Thallium',
        'barium_avg': 'Barium',
        'boron_avg': 'Boron',
        'radium_avg': 'Radium 226+228',
        'fluoride_avg': 'Fluoride',
        'chloride_avg': 'Chloride',
        'pH_avg': 'pH',
        'calcium_avg': 'Calcium',
        'sulfate_avg': 'Sulfate',
        'TDS_avg': 'Total Dissolved Solids',
        'beryllium_avg': 'Beryllium',
        'cadmium_avg': 'Cadmium',
        'selenium_avg': 'Selenium',
        'molybdenum_avg': 'Molybdenum',
        'cobalt_avg': 'Cobalt',
        'lithium_avg': 'Lithium',
    }.items()
}

# The per-contaminant scalars stay bound under their original names (despite the
# 'df' suffix they are plain means) in case another cell reads them. The unpacking
# relies on the dict keeping its insertion order.
(
    BR12_Medf, BR12_Andf, BR12_Ledf, BR12_Ardf, BR12_Chrdf, BR12_Tdf, BR12_Badf,
    BR12_Bodf, BR12_Rdf, BR12_Fdf, BR12_Chldf, BR12_Pdf, BR12_Caldf, BR12_Sudf,
    BR12_TDSdf, BR12_Berdf, BR12_Caddf, BR12_Sedf, BR12_Modf, BR12_Codf, BR12_Lidf,
) = BR12_dict.values()

BR12_dict

{'mercury_avg': 5.624999999999999e-07,
 'antimony_avg': 0.045837499999999996,
 'lead_avg': 0.005,
 'arsenic_avg': 0.005625,
 'chromium_avg': 0.01,
 'thallium_avg': 0.008175,
 'barium_avg': 0.0675,
 'boron_avg': 0.13677777777777778,
 'radium_avg': 0.58,
 'fluoride_avg': 0.2933333333333334,
 'chloride_avg': 320.55555555555554,
 'pH_avg': 6.978888888888889,
 'calcium_avg': 187.66666666666666,
 'sulfate_avg': 102.0,
 'TDS_avg': 1026.111111111111,
 'beryllium_avg': 0.00475,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.005,
 'molybdenum_avg': 0.01,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.049999999999999996}

In [25]:
# Mean concentration of every contaminant sampled at well MW-13D.
# The mapping pairs each '<contaminant>_avg' key with the label used in df['contaminant'];
# a contaminant with no rows at this well averages to NaN (mean of an empty selection).
_MW13_samples = df.loc[df['well'] == 'MW-13D']
MW13_dict = {
    key: _MW13_samples.loc[_MW13_samples['contaminant'] == label, 'concentration'].mean()
    for key, label in {
        'mercury_avg': 'Mercury',
        'antimony_avg': 'Antimony',
        'lead_avg': 'Lead',
        'arsenic_avg': 'Arsenic',
        'chromium_avg': 'Chromium',
        'thallium_avg': 'Thallium',
        'barium_avg': 'Barium',
        'boron_avg': 'Boron',
        'radium_avg': 'Radium 226+228',
        'fluoride_avg': 'Fluoride',
        'chloride_avg': 'Chloride',
        'pH_avg': 'pH',
        'calcium_avg': 'Calcium',
        'sulfate_avg': 'Sulfate',
        'TDS_avg': 'Total Dissolved Solids',
        'beryllium_avg': 'Beryllium',
        'cadmium_avg': 'Cadmium',
        'selenium_avg': 'Selenium',
        'molybdenum_avg': 'Molybdenum',
        'cobalt_avg': 'Cobalt',
        'lithium_avg': 'Lithium',
    }.items()
}

# The per-contaminant scalars stay bound under their original names (despite the
# 'df' suffix they are plain means) in case another cell reads them. The unpacking
# relies on the dict keeping its insertion order.
(
    MW13_Medf, MW13_Andf, MW13_Ledf, MW13_Ardf, MW13_Chrdf, MW13_Tdf, MW13_Badf,
    MW13_Bodf, MW13_Rdf, MW13_Fdf, MW13_Chldf, MW13_Pdf, MW13_Caldf, MW13_Sudf,
    MW13_TDSdf, MW13_Berdf, MW13_Caddf, MW13_Sedf, MW13_Modf, MW13_Codf, MW13_Lidf,
) = MW13_dict.values()

MW13_dict

{'mercury_avg': 6.25e-07,
 'antimony_avg': 0.0398375,
 'lead_avg': 0.016250000000000004,
 'arsenic_avg': 0.007499999999999999,
 'chromium_avg': 0.0062499999999999995,
 'thallium_avg': 0.007675,
 'barium_avg': 0.012499999999999999,
 'boron_avg': 1.8577777777777778,
 'radium_avg': 0.93375,
 'fluoride_avg': 0.5111111111111112,
 'chloride_avg': 37.333333333333336,
 'pH_avg': 7.62,
 'calcium_avg': 555.5555555555555,
 'sulfate_avg': 1958.888888888889,
 'TDS_avg': 2911.1111111111113,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [26]:
# Mean concentration of every contaminant sampled at well MW-7D.
# The mapping pairs each '<contaminant>_avg' key with the label used in df['contaminant'];
# a contaminant with no rows at this well averages to NaN (mean of an empty selection).
_MW7_samples = df.loc[df['well'] == 'MW-7D']
MW7_dict = {
    key: _MW7_samples.loc[_MW7_samples['contaminant'] == label, 'concentration'].mean()
    for key, label in {
        'mercury_avg': 'Mercury',
        'antimony_avg': 'Antimony',
        'lead_avg': 'Lead',
        'arsenic_avg': 'Arsenic',
        'chromium_avg': 'Chromium',
        'thallium_avg': 'Thallium',
        'barium_avg': 'Barium',
        'boron_avg': 'Boron',
        'radium_avg': 'Radium 226+228',
        'fluoride_avg': 'Fluoride',
        'chloride_avg': 'Chloride',
        'pH_avg': 'pH',
        'calcium_avg': 'Calcium',
        'sulfate_avg': 'Sulfate',
        'TDS_avg': 'Total Dissolved Solids',
        'beryllium_avg': 'Beryllium',
        'cadmium_avg': 'Cadmium',
        'selenium_avg': 'Selenium',
        'molybdenum_avg': 'Molybdenum',
        'cobalt_avg': 'Cobalt',
        'lithium_avg': 'Lithium',
    }.items()
}

# The per-contaminant scalars stay bound under their original names (despite the
# 'df' suffix they are plain means) in case another cell reads them. The unpacking
# relies on the dict keeping its insertion order.
(
    MW7_Medf, MW7_Andf, MW7_Ledf, MW7_Ardf, MW7_Chrdf, MW7_Tdf, MW7_Badf,
    MW7_Bodf, MW7_Rdf, MW7_Fdf, MW7_Chldf, MW7_Pdf, MW7_Caldf, MW7_Sudf,
    MW7_TDSdf, MW7_Berdf, MW7_Caddf, MW7_Sedf, MW7_Modf, MW7_Codf, MW7_Lidf,
) = MW7_dict.values()

MW7_dict

{'mercury_avg': 6.25e-07,
 'antimony_avg': 0.04725,
 'lead_avg': 0.016250000000000004,
 'arsenic_avg': 0.006999999999999998,
 'chromium_avg': 0.0062499999999999995,
 'thallium_avg': 0.008837500000000002,
 'barium_avg': 0.014999999999999998,
 'boron_avg': 1.402222222222222,
 'radium_avg': 0.5875000000000001,
 'fluoride_avg': 0.6211111111111111,
 'chloride_avg': 5.111111111111111,
 'pH_avg': 7.660000000000001,
 'calcium_avg': 571.2222222222222,
 'sulfate_avg': 1780.0,
 'TDS_avg': 2701.1111111111113,
 'beryllium_avg': 0.004375,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.006874999999999998,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [27]:
# Mean concentration of every contaminant sampled at well MW-11D.
# The mapping pairs each '<contaminant>_avg' key with the label used in df['contaminant'];
# a contaminant with no rows at this well averages to NaN (mean of an empty selection).
_MW11_samples = df.loc[df['well'] == 'MW-11D']
MW11_dict = {
    key: _MW11_samples.loc[_MW11_samples['contaminant'] == label, 'concentration'].mean()
    for key, label in {
        'mercury_avg': 'Mercury',
        'antimony_avg': 'Antimony',
        'lead_avg': 'Lead',
        'arsenic_avg': 'Arsenic',
        'chromium_avg': 'Chromium',
        'thallium_avg': 'Thallium',
        'barium_avg': 'Barium',
        'boron_avg': 'Boron',
        'radium_avg': 'Radium 226+228',
        'fluoride_avg': 'Fluoride',
        'chloride_avg': 'Chloride',
        'pH_avg': 'pH',
        'calcium_avg': 'Calcium',
        'sulfate_avg': 'Sulfate',
        'TDS_avg': 'Total Dissolved Solids',
        'beryllium_avg': 'Beryllium',
        'cadmium_avg': 'Cadmium',
        'selenium_avg': 'Selenium',
        'molybdenum_avg': 'Molybdenum',
        'cobalt_avg': 'Cobalt',
        'lithium_avg': 'Lithium',
    }.items()
}

# The per-contaminant scalars stay bound under their original names (despite the
# 'df' suffix they are plain means) in case another cell reads them. The unpacking
# relies on the dict keeping its insertion order.
(
    MW11_Medf, MW11_Andf, MW11_Ledf, MW11_Ardf, MW11_Chrdf, MW11_Tdf, MW11_Badf,
    MW11_Bodf, MW11_Rdf, MW11_Fdf, MW11_Chldf, MW11_Pdf, MW11_Caldf, MW11_Sudf,
    MW11_TDSdf, MW11_Berdf, MW11_Caddf, MW11_Sedf, MW11_Modf, MW11_Codf, MW11_Lidf,
) = MW11_dict.values()

MW11_dict

{'mercury_avg': 7.625000000000001e-07,
 'antimony_avg': 0.0401,
 'lead_avg': 0.016250000000000004,
 'arsenic_avg': 0.01225,
 'chromium_avg': 0.007624999999999998,
 'thallium_avg': 0.007925000000000001,
 'barium_avg': 0.03875000000000001,
 'boron_avg': 1.328888888888889,
 'radium_avg': 0.7433333333333333,
 'fluoride_avg': 0.4677777777777778,
 'chloride_avg': 11.555555555555555,
 'pH_avg': 7.486666666666668,
 'calcium_avg': 391.6666666666667,
 'sulfate_avg': 1363.4444444444443,
 'TDS_avg': 2144.4444444444443,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [28]:
# Mean concentration of every tracked contaminant at well MW-14D.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
mw14_rows = df.loc[df['well'] == 'MW-14D']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
MW14_dict = {
    key: mw14_rows.loc[mw14_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
MW14_dict

{'mercury_avg': 6.25e-07,
 'antimony_avg': 0.0471875,
 'lead_avg': 0.016250000000000004,
 'arsenic_avg': 0.013124999999999998,
 'chromium_avg': 0.007499999999999999,
 'thallium_avg': 0.008837500000000002,
 'barium_avg': 0.014999999999999998,
 'boron_avg': 1.1055555555555554,
 'radium_avg': 0.8042857142857144,
 'fluoride_avg': 0.3655555555555556,
 'chloride_avg': 35.888888888888886,
 'pH_avg': 7.680000000000001,
 'calcium_avg': 447.8888888888889,
 'sulfate_avg': 1577.7777777777778,
 'TDS_avg': 2370.0,
 'beryllium_avg': 0.004375,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.006375,
 'molybdenum_avg': 0.014749999999999997,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [29]:
# Mean concentration of every tracked contaminant at well MW-12D.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
mw12_rows = df.loc[df['well'] == 'MW-12D']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
MW12_dict = {
    key: mw12_rows.loc[mw12_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
MW12_dict

{'mercury_avg': 1.225e-06,
 'antimony_avg': 0.0408125,
 'lead_avg': 0.016375000000000004,
 'arsenic_avg': 0.006375,
 'chromium_avg': 0.0062499999999999995,
 'thallium_avg': 0.010300000000000002,
 'barium_avg': 0.0625,
 'boron_avg': 0.6444444444444445,
 'radium_avg': 0.5000000000000001,
 'fluoride_avg': 0.5288888888888889,
 'chloride_avg': 3.888888888888889,
 'pH_avg': 7.4399999999999995,
 'calcium_avg': 105.77777777777777,
 'sulfate_avg': 161.88888888888889,
 'TDS_avg': 770.6666666666666,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.015124999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [30]:
# Mean concentration of every tracked contaminant at well CCR-4.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
ccr4_rows = df.loc[df['well'] == 'CCR-4']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
CCR4_dict = {
    key: ccr4_rows.loc[ccr4_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
CCR4_dict

{'mercury_avg': 7.375000000000001e-07,
 'antimony_avg': 0.04625,
 'lead_avg': 0.016375000000000004,
 'arsenic_avg': 0.009375000000000003,
 'chromium_avg': 0.0062499999999999995,
 'thallium_avg': 0.007675,
 'barium_avg': 0.012499999999999999,
 'boron_avg': 1.5666666666666664,
 'radium_avg': 1.095,
 'fluoride_avg': 0.49444444444444446,
 'chloride_avg': 34.44444444444444,
 'pH_avg': 7.2955555555555565,
 'calcium_avg': 610.8888888888889,
 'sulfate_avg': 1832.2222222222222,
 'TDS_avg': 2856.6666666666665,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.006624999999999999,
 'molybdenum_avg': 0.013874999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [31]:
# Mean concentration of every tracked contaminant at well CCR-5.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
ccr5_rows = df.loc[df['well'] == 'CCR-5']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
CCR5_dict = {
    key: ccr5_rows.loc[ccr5_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
CCR5_dict

{'mercury_avg': 6.25e-07,
 'antimony_avg': 0.04665,
 'lead_avg': 0.016375000000000004,
 'arsenic_avg': 0.009250000000000001,
 'chromium_avg': 0.0062499999999999995,
 'thallium_avg': 0.007675,
 'barium_avg': 0.014999999999999998,
 'boron_avg': 1.397777777777778,
 'radium_avg': 1.4437499999999999,
 'fluoride_avg': 0.5188888888888888,
 'chloride_avg': 31.0,
 'pH_avg': 7.210000000000002,
 'calcium_avg': 620.7777777777778,
 'sulfate_avg': 1810.0,
 'TDS_avg': 2775.5555555555557,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [32]:
# Mean concentration of every tracked contaminant at well CCR-6.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
ccr6_rows = df.loc[df['well'] == 'CCR-6']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
CCR6_dict = {
    key: ccr6_rows.loc[ccr6_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
CCR6_dict

{'mercury_avg': 6.25e-07,
 'antimony_avg': 0.0466875,
 'lead_avg': 0.016625000000000004,
 'arsenic_avg': 0.010250000000000002,
 'chromium_avg': 0.0062499999999999995,
 'thallium_avg': 0.007675,
 'barium_avg': 0.012499999999999999,
 'boron_avg': 1.4555555555555557,
 'radium_avg': 0.8300000000000001,
 'fluoride_avg': 0.4911111111111111,
 'chloride_avg': 28.0,
 'pH_avg': 7.477777777777778,
 'calcium_avg': 619.2222222222222,
 'sulfate_avg': 1808.888888888889,
 'TDS_avg': 2805.5555555555557,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [33]:
# Mean concentration of every tracked contaminant at well CCR-3.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
ccr3_rows = df.loc[df['well'] == 'CCR-3']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
CCR3_dict = {
    key: ccr3_rows.loc[ccr3_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
CCR3_dict

{'mercury_avg': 1.1625e-06,
 'antimony_avg': 0.0472,
 'lead_avg': 0.017,
 'arsenic_avg': 0.008625,
 'chromium_avg': 0.0062499999999999995,
 'thallium_avg': 0.0153,
 'barium_avg': 0.065,
 'boron_avg': 1.2911111111111113,
 'radium_avg': 0.87,
 'fluoride_avg': 0.2044444444444444,
 'chloride_avg': 219.22222222222223,
 'pH_avg': 6.771111111111112,
 'calcium_avg': 468.8888888888889,
 'sulfate_avg': 751.5555555555555,
 'TDS_avg': 2562.222222222222,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [34]:
# Mean concentration of every tracked contaminant at well CCR-2.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
ccr2_rows = df.loc[df['well'] == 'CCR-2']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
CCR2_dict = {
    key: ccr2_rows.loc[ccr2_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
CCR2_dict

{'mercury_avg': 2.224999999999999e-06,
 'antimony_avg': 0.045712499999999996,
 'lead_avg': 0.019375000000000003,
 'arsenic_avg': 0.03175,
 'chromium_avg': 0.007749999999999999,
 'thallium_avg': 0.007675,
 'barium_avg': 0.08250000000000002,
 'boron_avg': 6.915555555555556,
 'radium_avg': 0.6866666666666666,
 'fluoride_avg': 0.42333333333333334,
 'chloride_avg': 31.444444444444443,
 'pH_avg': 8.043333333333333,
 'calcium_avg': 172.66666666666666,
 'sulfate_avg': 340.0,
 'TDS_avg': 816.7777777777778,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.09500000000000003}

In [35]:
# Mean concentration of every tracked contaminant at well CCR-1.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
ccr1_rows = df.loc[df['well'] == 'CCR-1']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
CCR1_dict = {
    key: ccr1_rows.loc[ccr1_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
CCR1_dict

{'mercury_avg': 7.125000000000001e-07,
 'antimony_avg': 0.04575,
 'lead_avg': 0.035875,
 'arsenic_avg': 0.007499999999999999,
 'chromium_avg': 0.006624999999999999,
 'thallium_avg': 0.030925000000000005,
 'barium_avg': 0.09375000000000003,
 'boron_avg': 0.20666666666666667,
 'radium_avg': 0.73,
 'fluoride_avg': 0.18666666666666665,
 'chloride_avg': 46.0,
 'pH_avg': 8.177777777777777,
 'calcium_avg': 46.111111111111114,
 'sulfate_avg': 39.333333333333336,
 'TDS_avg': 243.44444444444446,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.008625,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06249999999999999}

In [36]:
# Mean concentration of every tracked contaminant at well A-2.
# Keys are the summary names used in the result; values are the labels
# matched against df['contaminant'].
avg_key_to_contaminant = {
    'mercury_avg': 'Mercury',
    'antimony_avg': 'Antimony',
    'lead_avg': 'Lead',
    'arsenic_avg': 'Arsenic',
    'chromium_avg': 'Chromium',
    'thallium_avg': 'Thallium',
    'barium_avg': 'Barium',
    'boron_avg': 'Boron',
    'radium_avg': 'Radium 226+228',
    'fluoride_avg': 'Fluoride',
    'chloride_avg': 'Chloride',
    'pH_avg': 'pH',
    'calcium_avg': 'Calcium',
    'sulfate_avg': 'Sulfate',
    'TDS_avg': 'Total Dissolved Solids',
    'beryllium_avg': 'Beryllium',
    'cadmium_avg': 'Cadmium',
    'selenium_avg': 'Selenium',
    'molybdenum_avg': 'Molybdenum',
    'cobalt_avg': 'Cobalt',
    'lithium_avg': 'Lithium',
}

# Select the well's rows once rather than re-filtering df per contaminant.
a2_rows = df.loc[df['well'] == 'A-2']

# A contaminant with no rows for this well produces NaN (mean of an empty Series).
A2_dict = {
    key: a2_rows.loc[a2_rows['contaminant'] == name, 'concentration'].mean()
    for key, name in avg_key_to_contaminant.items()
}
A2_dict

{'mercury_avg': 6.25e-07,
 'antimony_avg': 0.045987499999999994,
 'lead_avg': 0.018000000000000002,
 'arsenic_avg': 0.006874999999999999,
 'chromium_avg': 0.006874999999999998,
 'thallium_avg': 0.01105,
 'barium_avg': 0.04000000000000001,
 'boron_avg': 0.7711111111111112,
 'radium_avg': 1.4450000000000003,
 'fluoride_avg': 0.35,
 'chloride_avg': 121.0,
 'pH_avg': 6.962222222222221,
 'calcium_avg': 618.5555555555555,
 'sulfate_avg': 1607.7777777777778,
 'TDS_avg': 2812.222222222222,
 'beryllium_avg': 0.00425,
 'cadmium_avg': 0.005,
 'selenium_avg': 0.0062499999999999995,
 'molybdenum_avg': 0.013749999999999998,
 'cobalt_avg': 0.049999999999999996,
 'lithium_avg': 0.06624999999999999}

In [37]:
# Two-well preview: after the transpose, rows are the *_avg keys and the
# columns are the labels supplied as the pre-transpose index.
df1 = pd.DataFrame([BR14_dict, BR20_dict], index=['BR14', 'BR20']).T

df1

Unnamed: 0,BR14,BR20
mercury_avg,5.625e-07,5.625e-07
antimony_avg,0.0454375,0.045375
lead_avg,0.005,0.005
arsenic_avg,0.005875,0.00525
chromium_avg,0.005,0.005125
thallium_avg,0.007675,0.007675
barium_avg,0.16625,1.66625
boron_avg,0.1784444,1.398889
radium_avg,0.4875,1.4975
fluoride_avg,0.2033333,0.3222222


In [38]:
# Summary table: one row per monitoring well, one column per averaged
# contaminant. `data` and `index` are parallel lists - the n-th dict of
# averages belongs to the n-th well id.
df1 = pd.DataFrame(
    data=[
        BR3_dict, BR12_dict, BR13_dict, BR14_dict, BR20_dict,
        MW7_dict, MW11_dict, MW12_dict, MW13_dict, MW14_dict,
        CCR1_dict, CCR2_dict, CCR3_dict, CCR4_dict, CCR5_dict, CCR6_dict,
        A2_dict,
    ],
    index=[
        'BR-3-DG', 'BR-12-DG', 'BR-13-DG', 'BR-14-UG', 'BR-20-DG',
        'MW-7D', 'MW-11D', 'MW-12D', 'MW-13D', 'MW-14D',
        'CCR-1', 'CCR-2', 'CCR-3', 'CCR-4', 'CCR-5', 'CCR-6',
        'A-2',
    ],
)

# Column labels are (re)assigned by position, so this list must stay in the
# same order as the keys of the per-well dicts.
df1.columns = [
    'mercury_avg', 'antimony_avg', 'lead_avg', 'arsenic_avg', 'chromium_avg',
    'thallium_avg', 'barium_avg', 'boron_avg', 'radium_avg', 'fluoride_avg',
    'chloride_avg', 'pH_avg', 'calcium_avg', 'sulfate_avg', 'TDS_avg',
    'beryllium_avg', 'cadmium_avg', 'selenium_avg', 'molybdenum_avg',
    'cobalt_avg', 'lithium_avg',
]

# Name the index so the rendered table shows what the row labels are.
df1 = df1.rename_axis("well id")
df1

#change index to account for wells

Unnamed: 0_level_0,mercury_avg,antimony_avg,lead_avg,arsenic_avg,chromium_avg,thallium_avg,barium_avg,boron_avg,radium_avg,fluoride_avg,...,pH_avg,calcium_avg,sulfate_avg,TDS_avg,beryllium_avg,cadmium_avg,selenium_avg,molybdenum_avg,cobalt_avg,lithium_avg
well id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
BR-3-DG,5.625e-07,0.0457,0.005125,0.005875,0.005,0.007925,0.03875,0.093556,0.69125,0.227778,...,7.118889,126.333333,155.111111,606.111111,0.00475,0.005,0.005,0.01,0.05,0.05
BR-12-DG,5.625e-07,0.045837,0.005,0.005625,0.01,0.008175,0.0675,0.136778,0.58,0.293333,...,6.978889,187.666667,102.0,1026.111111,0.00475,0.005,0.005,0.01,0.05,0.05
BR-13-DG,5.625e-07,0.045562,0.005,0.005375,0.005,0.007925,0.07375,0.196111,0.465,0.201111,...,7.135556,105.0,102.888889,554.444444,0.00475,0.005,0.005,0.01,0.05,0.05
BR-14-UG,5.625e-07,0.045437,0.005,0.005875,0.005,0.007675,0.16625,0.178444,0.4875,0.203333,...,7.083333,95.222222,108.666667,477.222222,0.00475,0.005,0.005,0.01,0.05,0.05
BR-20-DG,5.625e-07,0.045375,0.005,0.00525,0.005125,0.007675,1.66625,1.398889,1.4975,0.322222,...,7.573333,23.111111,13.555556,684.444444,0.00475,0.005,0.005,0.01,0.05,0.05
MW-7D,6.25e-07,0.04725,0.01625,0.007,0.00625,0.008838,0.015,1.402222,0.5875,0.621111,...,7.66,571.222222,1780.0,2701.111111,0.004375,0.005,0.006875,0.01375,0.05,0.0625
MW-11D,7.625e-07,0.0401,0.01625,0.01225,0.007625,0.007925,0.03875,1.328889,0.743333,0.467778,...,7.486667,391.666667,1363.444444,2144.444444,0.00425,0.005,0.00625,0.01375,0.05,0.0625
MW-12D,1.225e-06,0.040813,0.016375,0.006375,0.00625,0.0103,0.0625,0.644444,0.5,0.528889,...,7.44,105.777778,161.888889,770.666667,0.00425,0.005,0.00625,0.015125,0.05,0.0625
MW-13D,6.25e-07,0.039837,0.01625,0.0075,0.00625,0.007675,0.0125,1.857778,0.93375,0.511111,...,7.62,555.555556,1958.888889,2911.111111,0.00425,0.005,0.00625,0.01375,0.05,0.0625
MW-14D,6.25e-07,0.047188,0.01625,0.013125,0.0075,0.008838,0.015,1.105556,0.804286,0.365556,...,7.68,447.888889,1577.777778,2370.0,0.004375,0.005,0.006375,0.01475,0.05,0.0625


In [56]:
#for gradient column
# Each name receives the array of distinct `gradient` values recorded for one
# well. Targets and well ids are matched by position, so keep both sequences
# in the same order.
(
    BR3, BR12, BR13, BR14, BR20,
    MW7, MW11, MW12, MW13, MW14,
    CCR1, CCR2, CCR3, CCR4, CCR5, CCR6,
    A2,
) = (
    df.loc[df['well'] == well_id].gradient.unique()
    for well_id in (
        'BR-3-DG', 'BR-12-DG', 'BR-13-DG', 'BR-14-UG', 'BR-20-DG',
        'MW-7D', 'MW-11D', 'MW-12D', 'MW-13D', 'MW-14D',
        'CCR-1', 'CCR-2', 'CCR-3', 'CCR-4', 'CCR-5', 'CCR-6',
        'A-2',
    )
)

In [59]:
#for site column
# Each name receives the array of distinct `site` values recorded for one
# well. Targets and well ids are matched by position, so keep both sequences
# in the same order.
(
    _BR3, _BR12, _BR13, _BR14, _BR20,
    _MW7, _MW11, _MW12, _MW13, _MW14,
    _CCR1, _CCR2, _CCR3, _CCR4, _CCR5, _CCR6,
    _A2,
) = (
    df.loc[df['well'] == well_id].site.unique()
    for well_id in (
        'BR-3-DG', 'BR-12-DG', 'BR-13-DG', 'BR-14-UG', 'BR-20-DG',
        'MW-7D', 'MW-11D', 'MW-12D', 'MW-13D', 'MW-14D',
        'CCR-1', 'CCR-2', 'CCR-3', 'CCR-4', 'CCR-5', 'CCR-6',
        'A-2',
    )
)

In [60]:
#for disposal column
# Each name receives the array of distinct `disposal` values recorded for one
# well. Targets and well ids are matched by position, so keep both sequences
# in the same order.
(
    __BR3, __BR12, __BR13, __BR14, __BR20,
    __MW7, __MW11, __MW12, __MW13, __MW14,
    __CCR1, __CCR2, __CCR3, __CCR4, __CCR5, __CCR6,
    __A2,
) = (
    df.loc[df['well'] == well_id].disposal.unique()
    for well_id in (
        'BR-3-DG', 'BR-12-DG', 'BR-13-DG', 'BR-14-UG', 'BR-20-DG',
        'MW-7D', 'MW-11D', 'MW-12D', 'MW-13D', 'MW-14D',
        'CCR-1', 'CCR-2', 'CCR-3', 'CCR-4', 'CCR-5', 'CCR-6',
        'A-2',
    )
)

In [61]:
#series
# Reduce each per-well array of distinct values to its first entry, giving one
# label per well in the order BR-3 ... CCR-6, A-2.
gradient = [
    per_well[0]
    for per_well in (
        BR3, BR12, BR13, BR14, BR20,
        MW7, MW11, MW12, MW13, MW14,
        CCR1, CCR2, CCR3, CCR4, CCR5, CCR6,
        A2,
    )
]
site = [
    per_well[0]
    for per_well in (
        _BR3, _BR12, _BR13, _BR14, _BR20,
        _MW7, _MW11, _MW12, _MW13, _MW14,
        _CCR1, _CCR2, _CCR3, _CCR4, _CCR5, _CCR6,
        _A2,
    )
]
disposal = [
    per_well[0]
    for per_well in (
        __BR3, __BR12, __BR13, __BR14, __BR20,
        __MW7, __MW11, __MW12, __MW13, __MW14,
        __CCR1, __CCR2, __CCR3, __CCR4, __CCR5, __CCR6,
        __A2,
    )
]

#type & unit?

In [63]:
# Attach the descriptive per-well attributes as extra columns. The lists carry
# no index, so they are matched to df1's rows purely by position.
for column_label, column_values in (
    ('gradient', gradient),
    ('site', site),
    ('disposal', disposal),
):
    df1[column_label] = column_values

df1

Unnamed: 0_level_0,mercury_avg,antimony_avg,lead_avg,arsenic_avg,chromium_avg,thallium_avg,barium_avg,boron_avg,radium_avg,fluoride_avg,...,TDS_avg,beryllium_avg,cadmium_avg,selenium_avg,molybdenum_avg,cobalt_avg,lithium_avg,gradient,site,disposal
well id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
BR-3-DG,5.625e-07,0.0457,0.005125,0.005875,0.005,0.007925,0.03875,0.093556,0.69125,0.227778,...,606.111111,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill
BR-12-DG,5.625e-07,0.045837,0.005,0.005625,0.01,0.008175,0.0675,0.136778,0.58,0.293333,...,1026.111111,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill
BR-13-DG,5.625e-07,0.045562,0.005,0.005375,0.005,0.007925,0.07375,0.196111,0.465,0.201111,...,554.444444,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill
BR-14-UG,5.625e-07,0.045437,0.005,0.005875,0.005,0.007675,0.16625,0.178444,0.4875,0.203333,...,477.222222,0.00475,0.005,0.005,0.01,0.05,0.05,Upgradient,Dunkirk Generating Station,Dunkirk Landfill
BR-20-DG,5.625e-07,0.045375,0.005,0.00525,0.005125,0.007675,1.66625,1.398889,1.4975,0.322222,...,684.444444,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill
MW-7D,6.25e-07,0.04725,0.01625,0.007,0.00625,0.008838,0.015,1.402222,0.5875,0.621111,...,2701.111111,0.004375,0.005,0.006875,0.01375,0.05,0.0625,Downgradient,Huntley Generating Station,Huntley Landfill
MW-11D,7.625e-07,0.0401,0.01625,0.01225,0.007625,0.007925,0.03875,1.328889,0.743333,0.467778,...,2144.444444,0.00425,0.005,0.00625,0.01375,0.05,0.0625,Downgradient,Huntley Generating Station,Huntley Landfill
MW-12D,1.225e-06,0.040813,0.016375,0.006375,0.00625,0.0103,0.0625,0.644444,0.5,0.528889,...,770.666667,0.00425,0.005,0.00625,0.015125,0.05,0.0625,Upgradient,Huntley Generating Station,Huntley Landfill
MW-13D,6.25e-07,0.039837,0.01625,0.0075,0.00625,0.007675,0.0125,1.857778,0.93375,0.511111,...,2911.111111,0.00425,0.005,0.00625,0.01375,0.05,0.0625,Downgradient,Huntley Generating Station,Huntley Landfill
MW-14D,6.25e-07,0.047188,0.01625,0.013125,0.0075,0.008838,0.015,1.105556,0.804286,0.365556,...,2370.0,0.004375,0.005,0.006375,0.01475,0.05,0.0625,Downgradient,Huntley Generating Station,Huntley Landfill


In [69]:
### stats - TODO
# - min, max and range of each contaminant
# - average of each contaminant, split by gradient

# - weighted mean of the chemicals, to estimate the overall toxicity of each well

In [85]:
#plot

# Copy the row labels (the "well id" index) into an ordinary 'well' column;
# the bar charts in the following cells encode x='well', which has to be a
# regular column of the frame passed to alt.Chart.
df1['well'] = df1.index
# Preview the first rows to check that the new column was added.
df1.head()

Unnamed: 0_level_0,mercury_avg,antimony_avg,lead_avg,arsenic_avg,chromium_avg,thallium_avg,barium_avg,boron_avg,radium_avg,fluoride_avg,...,beryllium_avg,cadmium_avg,selenium_avg,molybdenum_avg,cobalt_avg,lithium_avg,gradient,site,disposal,well
well id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
BR-3-DG,5.625e-07,0.0457,0.005125,0.005875,0.005,0.007925,0.03875,0.093556,0.69125,0.227778,...,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill,BR-3-DG
BR-12-DG,5.625e-07,0.045837,0.005,0.005625,0.01,0.008175,0.0675,0.136778,0.58,0.293333,...,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill,BR-12-DG
BR-13-DG,5.625e-07,0.045562,0.005,0.005375,0.005,0.007925,0.07375,0.196111,0.465,0.201111,...,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill,BR-13-DG
BR-14-UG,5.625e-07,0.045437,0.005,0.005875,0.005,0.007675,0.16625,0.178444,0.4875,0.203333,...,0.00475,0.005,0.005,0.01,0.05,0.05,Upgradient,Dunkirk Generating Station,Dunkirk Landfill,BR-14-UG
BR-20-DG,5.625e-07,0.045375,0.005,0.00525,0.005125,0.007675,1.66625,1.398889,1.4975,0.322222,...,0.00475,0.005,0.005,0.01,0.05,0.05,Downgradient,Dunkirk Generating Station,Dunkirk Landfill,BR-20-DG


In [98]:
# Bar chart of the mean mercury concentration per well; bar colour shows the
# well's gradient label.
(
    alt.Chart(df1)
    .mark_bar()
    .encode(
        x='well',
        y='mercury_avg',
        color='gradient',
    )
)

# Earlier seaborn-based colouring attempt, kept for reference (not executed):
#clrs = ['blue' if (df1['gradient'] == 'Downgradient') else 'red']
#sb.barplot(x=idx, y=values, palette=clrs) # color=clrs)

In [113]:
#radioactive chemical - really bad if over 5 pCi/L

# Mean radium per well. The y-axis domain is fixed to 0-5 so bar heights can
# be read against the 5 pCi/L level mentioned above.
(
    alt.Chart(df1)
    .mark_bar()
    .encode(
        x='well',
        y=alt.Y('radium_avg', scale=alt.Scale(domain=(0, 5))),
        color='gradient',
    )
)

In [112]:
#pH ranges from 0-14 su (acidic < 7 < basic)
#normal range for groundwater systems is 6-8.5 su

# Mean pH per well, drawn on the full 0-14 scale so the bars are shown
# relative to the whole pH range.
(
    alt.Chart(df1)
    .mark_bar()
    .encode(
        x='well',
        y=alt.Y('pH_avg', scale=alt.Scale(domain=(0, 14))),
        color='gradient',
    )
)

In [114]:
# Mean arsenic concentration per well, coloured by gradient.
(
    alt.Chart(df1)
    .mark_bar()
    .encode(
        x='well',
        y='arsenic_avg',
        color='gradient',
    )
)

In [115]:
# Mean selenium concentration per well, coloured by gradient.
(
    alt.Chart(df1)
    .mark_bar()
    .encode(
        x='well',
        y='selenium_avg',
        color='gradient',
    )
)

In [116]:
# Mean fluoride concentration per well, coloured by gradient.
(
    alt.Chart(df1)
    .mark_bar()
    .encode(
        x='well',
        y='fluoride_avg',
        color='gradient',
    )
)