# Pre-processing Arizona Allocation data for WaDEQA upload.
Date Updated: 04/06/2020
Purpose:  To pre-process the Arizona data into one master file for simple DataFrame creation and extraction

Useful Links to Data:

The water rights data were obtained from the Arizona Department of Water Resources (ADWR) GIS data: http://gisdata-azwater.opendata.arcgis.com/

Overview of Arizona Groundwater management Code can be found at: http://infoshare.azwater.gov/docushare/dsweb/Get/Document-11348/Groundwater_Code_Overview.pdf

Well Registry (Wells55) csv Data: http://gisdata-azwater.opendata.arcgis.com/datasets/38abfdd1dad4485192d7524f2d37a3eb_0

GWSI Sites csv Data: http://gisdata-azwater.opendata.arcgis.com/datasets/59bfec619a0a4f3f9211a3452ea5e1f2_0

In [1]:
#Needed Libararies
import os
import numpy as np
import pandas as pd
from datetime import datetime
pd.set_option('display.max_columns', 999)  # How to display all columns of a Pandas DataFrame in Jupyter Notebook

In [2]:
#Working Directory and Input File
workingDir = "C:/Users/rjame/Documents/WSWC Documents/MappingStatesDataToWaDE2.0/Arizona/WaterAllocation/RawInputData"
os.chdir(workingDir)

WellRegistry_Input = "Well_Registry_Wells55.csv"
GWSI_Input = "GWSI_Sites.csv"

In [3]:
#Dataframe creation
df_WR = pd.read_csv(WellRegistry_Input, encoding = "ISO-8859-1")
df_GWSI = pd.read_csv(GWSI_Input, encoding = "ISO-8859-1")

#Merge
df = pd.merge(df_WR, df_GWSI, left_on='REGISTRY_ID', right_on='REG_ID', how='inner') #

  interactivity=interactivity, compiler=compiler, result=result)


In [10]:
df

Unnamed: 0,ï»¿X_x,Y_x,OBJECTID_x,PROGRAM,REGISTRY_ID,OWNER_NAME,RGR_PUMP_DATA,WELLTYPE,WELL_TYPE_GROUP,DLIC_NUM,APPROVED,INSTALLED,WELL_DEPTH_x,WATER_LEVEL,CASING_DEPTH,CASING_DIAMETER,CASING_TYPE,PUMP_TYPE,PUMP_POWER,PUMPRATE,TESTEDRATE,DRAW_DOWN,COMPLETION_REPORT_STATUS,DRILL_LOG,WELL_CANCELLED,CADASTRAL,COUNTY,WATERSHED,BASIN_NAME,SUBBASIN_NAME,AMA,QUAD_CODE,WHOLE_TOWNSHIP,HALF_TOWNSHIP,NORTHSOUTH,WHOLE_RANGE,HALF_RANGE,EASTWEST,SECTION,QUARTER_160_ACRE,QACRE160DIR,QUARTER_40_ACRE,QACRE40DIR,QUARTER_10_ACRE,QACRE10DIR,UTM_X_METERS,UTM_Y_METERS,APPLICATION_DATE,ADDRESS1,ADDRESS2,CITY,STATE,ZIP,ZIP4,ï»¿X_y,Y_y,OBJECTID_y,SITE_ID,LOCAL_ID,REG_ID,WELL_TYPE,DD_LAT,DD_LONG,LAT_NAD27,LONG_NAD27,WELL_ALT,WATER_USE,WELL_DEPTH_y,CASE_DIAM,DRILL_DATE,WL_COUNT,LASTWLDATE,WL_DTW,WL_ELEV,SOURCE,IDXBK
0,-109.311508,31.777491,2004,55,87306,"CORONADO NATL FOREST,",NO,EXEMPT,EXEMPT,0.0,,1981-01-01T00:00:00.000Z,153.0,8.0,153.0,6.0,,,ELECTRIC MOTOR < 1 HP,0.0,10.0,117.0,,,,D19030018DAA,COCHISE,WHITE WATER DRAW,WILLCOX,WILLCOX,OUTSIDE OF AMA OR INA,D,19,0.0,S,30,0.0,E,18,D,SE,A,NE,A,NE,659882.4,3517013,1997-09-24,301 W CONGRESS,,TUCSON,AZ,,,-109.311740,31.775933,929,314633109184001,D-19-30 18DAD UNSURV,87306.0,GWSI,31.775833,-109.311111,31 46 33.0,109 18 40.0,6050,DOMESTIC,153.0,6.0,9/21/1981,0,,,,,
1,-111.019265,31.893196,2007,55,87309,FREEPORT-MCMORAN SIERRITA INC.,YES,NON-EXEMPT,NON-EXEMPT,7.0,1981-07-21T00:00:00.000Z,1982-08-26T00:00:00.000Z,1167.0,777.0,1063.0,18.0,,,ELECTRIC MOTOR > 100 HP,1250.0,1250.0,18.0,A,X,Y,D18013004ACC,PIMA,SANTA CRUZ RIVER,TUCSON AMA,UPPER SANTA CRUZ,TUCSON,D,18,0.0,S,13,0.0,E,4,A,NE,C,SW,C,SW,498179.2,3528597,1982-08-25,PO BOX 527,,GREEN VALLEY,AZ,,,-111.019269,31.892310,22293,315332111010701,D-18-13 04ACC2,87309.0,GWSI,31.892222,-111.018611,31 53 32.0,111 1 7.0,3326,MINING,1063.0,30.0,,0,,,,,
2,-110.656327,32.050822,2022,55,87324,"GOODMAN,W A",NO,EXEMPT,EXEMPT,137.0,,1981-06-30T00:00:00.000Z,400.0,168.0,400.0,4.0,,,NO POWER CODE LISTED,0.0,0.0,0.0,,,,D16016012DDA,PIMA,SANTA CRUZ RIVER,TUCSON AMA,UPPER SANTA CRUZ,TUCSON,D,16,0.0,S,16,0.0,E,12,D,SE,D,SE,A,NE,532444.9,3546120,1981-04-02,2309 S CAMINO SECO,,TUCSON,AZ,,,-110.656480,32.050641,18967,320302110392101,D-16-16 12DDA,87324.0,GWSI,32.050556,-110.655833,32 3 2.0,110 39 21.0,3660,UNUSED,400.0,4.0,6/3/1981,2,1/17/1995,114.5,3545.5,,
3,-109.142383,32.136640,2030,55,87332,"SHUMAKER,W R",NO,NON-EXEMPT,NON-EXEMPT,53.0,,1981-01-01T00:00:00.000Z,650.0,170.0,650.0,12.0,,,ELECTRIC MOTOR > 100 HP,600.0,600.0,0.0,,,,D15031011DDA,COCHISE,UPPER GILA RIVER,SAFFORD,SAN SIMON VALLEY,OUTSIDE OF AMA OR INA,D,15,0.0,S,31,0.0,E,11,D,SE,D,SE,A,NE,675215.6,3557092,1997-09-24,PO BOX 217,,SAN SIMON,AZ,,,-109.141181,32.136478,28676,320811109082601,D-15-31 11DDA,87332.0,GWSI,32.136389,-109.140556,32 8 11.0,109 8 26.0,3879,IRRIGATION,650.0,12.0,,3,2/6/2007,238.7,3640.3,,
4,-110.332116,32.058811,2043,55,87345,"RILEY WEST INC,",NO,NON-EXEMPT,NON-EXEMPT,76.0,,1981-01-01T00:00:00.000Z,128.0,45.0,128.0,16.0,,,ELECTRIC MOTOR 6 - 15 HP,0.0,380.0,53.0,,,,D16020008BCC,COCHISE,SAN PEDRO RIVER,UPPER SAN PEDRO,SIERRA VISTA,OUTSIDE OF AMA OR INA,D,16,0.0,S,20,0.0,E,8,B,NW,C,SW,C,SW,563046.5,3547149,1997-09-24,4400 E BROADWAY #811,,TUCSON,AZ,,,-110.331473,32.058974,18386,320332110195101,D-16-20 08BCC,87345.0,GWSI,32.058889,-110.330833,32 3 32.0,110 19 51.0,3425,IRRIGATION,128.0,16.0,,2,2/20/2002,34.4,3390.6,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
24334,-112.244560,34.674876,216258,55,923132,BRYCE ENTERPRISES,NO,EXEMPT,EXEMPT,331.0,2019-06-28T00:00:00.000Z,,220.0,100.0,220.0,5.0,,,,0.0,0.0,,,X,,A15001015DCB,YAVAPAI,AGUA FRIA RIVER,PRESCOTT AMA,UPPER AGUA FRIA,PRESCOTT,A,15,0.0,N,1,0.0,E,15,D,SE,C,SW,B,NW,385982.3,3837693,2019-06-28,3500 WILLOW CREEK RD,,PRESCOTT,AZ,,,-112.243842,34.675362,18353,344031112143801,A-15-01 15DCB2,923132.0,GWSI,34.675333,-112.243111,34 40 31.2,112 14 35.2,5270,DOMESTIC,220.0,7.0,7/22/2019,1,7/22/2019,100.0,5170.0,,
24335,-112.242366,34.674871,216259,55,923133,BRYCE ENTERPRISES,NO,EXEMPT,EXEMPT,331.0,2019-06-28T00:00:00.000Z,,200.0,,19.0,7.0,,,,0.0,0.0,,,X,,A15001015DCA,YAVAPAI,AGUA FRIA RIVER,PRESCOTT AMA,UPPER AGUA FRIA,PRESCOTT,A,15,0.0,N,1,0.0,E,15,D,SE,C,SW,A,NE,386183.3,3837690,2019-06-28,3500 WILLOW CREEK RD,,PRESCOTT,AZ,,,-112.243063,34.675363,24664,344031112143501,A-15-01 15DCA3,923133.0,GWSI,34.675334,-112.242332,34 40 31.2,112 14 32.4,5275,UNUSED,19.0,7.0,7/22/2019,0,,,,,
24336,-112.244560,34.674876,216260,55,923134,DNC DEVELOPMENT LLC,NO,EXEMPT,EXEMPT,331.0,2019-09-19T00:00:00.000Z,,400.0,,400.0,5.0,,,,0.0,0.0,,,X,,A15001015DCB,YAVAPAI,AGUA FRIA RIVER,PRESCOTT AMA,UPPER AGUA FRIA,PRESCOTT,A,15,0.0,N,1,0.0,E,15,D,SE,C,SW,B,NW,385982.3,3837693,2019-06-28,PO BOX 10336,,PRESCOTT,AZ,,,-112.245512,34.675363,30087,344031112144401,A-15-01 15DCB1,923134.0,GWSI,34.675334,-112.244781,34 40 31.2,112 14 41.2,5260,UNUSED,19.0,7.0,7/11/2019,0,,,,,
24337,-112.244560,34.674876,216261,55,923135,DNC DEVELOPMENT LLC,NO,EXEMPT,EXEMPT,331.0,2019-07-01T00:00:00.000Z,,200.0,,19.0,7.0,,,,0.0,0.0,,,X,,A15001015DCB,YAVAPAI,AGUA FRIA RIVER,PRESCOTT AMA,UPPER AGUA FRIA,PRESCOTT,A,15,0.0,N,1,0.0,E,15,D,SE,C,SW,B,NW,385982.3,3837693,2019-07-01,PO BOX 10336,,PRESCOTT,AZ,,,-112.244675,34.675362,37962,344031112144101,A-15-01 15DCB3,923135.0,GWSI,34.675333,-112.243944,34 40 31.2,112 14 38.2,5270,UNUSED,19.0,7.0,7/23/2019,0,,,,,


In [5]:
df.columns

Index(['ï»¿X_x', 'Y_x', 'OBJECTID_x', 'PROGRAM', 'REGISTRY_ID', 'OWNER_NAME',
       'RGR_PUMP_DATA', 'WELLTYPE', 'WELL_TYPE_GROUP', 'DLIC_NUM', 'APPROVED',
       'INSTALLED', 'WELL_DEPTH_x', 'WATER_LEVEL', 'CASING_DEPTH',
       'CASING_DIAMETER', 'CASING_TYPE', 'PUMP_TYPE', 'PUMP_POWER', 'PUMPRATE',
       'TESTEDRATE', 'DRAW_DOWN', 'COMPLETION_REPORT_STATUS', 'DRILL_LOG',
       'WELL_CANCELLED', 'CADASTRAL', 'COUNTY', 'WATERSHED', 'BASIN_NAME',
       'SUBBASIN_NAME', 'AMA', 'QUAD_CODE', 'WHOLE_TOWNSHIP', 'HALF_TOWNSHIP',
       'NORTHSOUTH', 'WHOLE_RANGE', 'HALF_RANGE', 'EASTWEST', 'SECTION',
       'QUARTER_160_ACRE', 'QACRE160DIR', 'QUARTER_40_ACRE', 'QACRE40DIR',
       'QUARTER_10_ACRE', 'QACRE10DIR', 'UTM_X_METERS', 'UTM_Y_METERS',
       'APPLICATION_DATE', 'ADDRESS1', 'ADDRESS2', 'CITY', 'STATE', 'ZIP',
       'ZIP4', 'ï»¿X_y', 'Y_y', 'OBJECTID_y', 'SITE_ID', 'LOCAL_ID', 'REG_ID',
       'WELL_TYPE', 'DD_LAT', 'DD_LONG', 'LAT_NAD27', 'LONG_NAD27', 'WELL_ALT',
       'WATER

In [6]:
with pd.option_context('display.max_rows', None, 'display.max_columns', None):
    print(df.dtypes)

ï»¿X_x                      float64
Y_x                         float64
OBJECTID_x                    int64
PROGRAM                       int64
REGISTRY_ID                   int64
OWNER_NAME                   object
RGR_PUMP_DATA                object
WELLTYPE                     object
WELL_TYPE_GROUP              object
DLIC_NUM                    float64
APPROVED                     object
INSTALLED                    object
WELL_DEPTH_x                float64
WATER_LEVEL                 float64
CASING_DEPTH                float64
CASING_DIAMETER             float64
CASING_TYPE                 float64
PUMP_TYPE                   float64
PUMP_POWER                   object
PUMPRATE                    float64
TESTEDRATE                  float64
DRAW_DOWN                   float64
COMPLETION_REPORT_STATUS     object
DRILL_LOG                    object
WELL_CANCELLED               object
CADASTRAL                    object
COUNTY                       object
WATERSHED                   

In [7]:
#Changing datatype of used date fields. 
df['APPLICATION_DATE'] = pd.to_datetime(df['APPLICATION_DATE'], errors = 'coerce')
df['APPLICATION_DATE'] = pd.to_datetime(df["APPLICATION_DATE"].dt.strftime('%m/%d/%Y'))

In [8]:
#Removing NaN, and missing (999) values from AllocaitonAmount, AllocaitonMaxium
df['PUMPRATE'] = df['PUMPRATE'].fillna(0)
df['PUMPRATE'] = df['PUMPRATE'].replace(999, 0)

df['TESTEDRATE'] = df['TESTEDRATE'].fillna(0)
df['TESTEDRATE'] = df['TESTEDRATE'].replace(999, 0)

In [9]:
#Exporting to Finished File
df.to_csv('P_ArizonaMaster.csv', index=False)  # The output