# Process Electricity Consumption

In [1]:
import numpy as np
import pandas as pd

In [4]:
file_path = "../City_Data/GRU_Electric_Data_byJulian/"

premises_df             = pd.read_csv(file_path + "PREMISE.csv")
contracts_df            = pd.read_csv(file_path + "CONTRACT.csv")
installations_df        = pd.read_csv(file_path + "INSTALL.csv")
consumption_df          = pd.read_csv(file_path + "CONSUMPTION.csv")
contract_accounts_df    = pd.read_csv(file_path + "CONTRACT_ACCOUNT.csv")
business_partners_df    = pd.read_csv(file_path + "BUSINESS_PARTNER.csv")
dunning_disconnects_df  = pd.read_csv(file_path + "DUNNING_DISCONNECTS.csv")

# Non-residential contract accounts
non_res_contract_accounts_df = contract_accounts_df[contract_accounts_df['CA_TYPE']=='NR']

# Non-residential contracts
business_contracts_df = contracts_df[contracts_df['CA'].isin(non_res_contract_accounts_df['CA'])]

# Non-residential installs
business_intalls_df = installations_df[installations_df['INSTALL'].isin(business_contracts_df['INSTALL'])]

# Non-residential premises
non_res_premises_df = premises_df[premises_df['PREMISE'].isin(business_intalls_df['PREMISE'])]
non_res_premises_df = non_res_premises_df[(non_res_premises_df['PREMISETYPE'] != 'XTELE') & 
                                          (non_res_premises_df['PREMISETYPE'] != 'RCMUSE')]

# Non-residential consumption
business_consumption_df = consumption_df[consumption_df['CONTRACT'].isin(business_contracts_df['CONTRACT'])]

** Electricity consumption for businesses **

In [5]:
def get_year_and_month(date):
    parts = date.split('/')
    global years, months
    try:
        years.append(int(parts[0]))
        months.append(int(parts[1]))
    except:
        years.append(0)
        months.append(0)

In [6]:
business_contracts_df[:1]

Unnamed: 0,INSTALL,CONTRACT,CA,STARTDATE,ENDDATE
0,5000059000.0,4000332116,200023567634,20070425,20070916


In [7]:
contract_accounts_df[:1]

Unnamed: 0,CA,BP,CA_TYPE,MAILINGADDRESS,MCITY,MREGION,MPOST_CODE,MCOUNTRY
0,200058060632,1000226073,R,12525 SW 11TH AVE,NEWBERRY,FL,32669-3059,US


In [8]:
business_partners_df[:1]

Unnamed: 0,BP,BP_TYPE,FIRST_NAME,LAST_NAME
0,1000091673,1,GABRIELE,HEIN


In [9]:
business_consumption_df[:1]

Unnamed: 0,CONTRACT,CONSUMPTION,UNIT,BILLINGPERIOD,BILLSTARTDATE,BILLENDDATE
142674,4001746555,653,KWH,2017/02,20170128,20170224


In [10]:
installations_df[:1]

Unnamed: 0,INSTALL,PREMISE,INSTALLTYPE,ZZCODE
0,5000001433,7000050491,ELEC,


In [11]:
# Get rid of bad data
bad_values = [
    np.nan,
    '00000-000-000',
    '55555-555-555',
    '66666-666-666',
    '77777-777-777',
    '88888-888-888',
    '99999-999-999',
    'UFCAM-PUS-000',
    'UFCAM-PUS-XXX'
]

premises_df['PARCEL'] = premises_df['PARCEL'] \
    .drop(axis='index', labels=premises_df.index[premises_df['PARCEL'].isin(bad_values)]) \
    .apply(lambda x: x.replace('-', ''))

# Merge datasets around "CONTRACT"
contract_details_df = business_contracts_df \
    .merge(contract_accounts_df[['CA', 'BP']], on='CA', how='inner') \
    .merge(business_partners_df[['BP', 'FIRST_NAME', 'LAST_NAME']], on='BP', how='inner') \
    .merge(business_consumption_df[['CONTRACT', 'CONSUMPTION', 'UNIT', 'BILLINGPERIOD']], on='CONTRACT', how='inner') \
    .merge(installations_df[installations_df['INSTALLTYPE'] == 'ELEC'][['INSTALL', 'PREMISE']], on='INSTALL', how='inner') \
    .merge(premises_df[['PREMISE', 'PARCEL']], on='PREMISE', how='inner')[[
#         'INSTALL',
#         'CONTRACT',
#         'FIRST_NAME',
#         'LAST_NAME',
        'CONSUMPTION',
        'BILLINGPERIOD',
        'PARCEL'
    ]]

contract_details_df

Unnamed: 0,CONSUMPTION,BILLINGPERIOD,PARCEL
0,11,2007/06,08230004015
1,0,2007/05,08230004015
2,19,2007/07,08230004015
3,399,2007/08,08230004015
4,1227,2007/09,08230004015
5,189,2007/09,08230004015
6,16,2013/06,09013005027
7,34,2013/05,09013005027
8,11,2013/04,09013005027
9,57,2013/06,09013005027


In [50]:
years = []
months = []
business_consumption['BILLINGPERIOD'].apply(get_year_and_month)
business_consumption['BILLINGYEAR'] = years
business_consumption['BILLINGMONTH'] = months

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  after removing the cwd from sys.path.
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  """


In [51]:
tempo = pd.merge(business_consumption, business_contracts, how='inner')
tempo.head()

Unnamed: 0,CONTRACT,CONSUMPTION,UNIT,BILLINGPERIOD,BILLSTARTDATE,BILLENDDATE,BILLINGYEAR,BILLINGMONTH,INSTALL,CA,STARTDATE,ENDDATE
0,4001746555,653,KWH,2017/02,20170128,20170224,2017,2,5000366000.0,200039280927,20160830,99991231
1,4001746555,1030,KWH,2017/03,20170225,20170329,2017,3,5000366000.0,200039280927,20160830,99991231
2,4001746555,943,KWH,2017/04,20170330,20170426,2017,4,5000366000.0,200039280927,20160830,99991231
3,4001746555,917,KWH,2017/05,20170427,20170526,2017,5,5000366000.0,200039280927,20160830,99991231
4,4001746555,839,KWH,2017/06,20170527,20170628,2017,6,5000366000.0,200039280927,20160830,99991231


In [52]:
electricity_cons_premisewise = pd.merge(tempo, business_intalls, how='inner')

In [53]:
# ACTIVE BUSINESS DATAFRAME
act_bus = pd.read_csv('../Active_Businesses_with_parcel.csv')

In [173]:
act_bus[act_bus['Parcel'] == '06013004008']

Unnamed: 0.1,Unnamed: 0,id,Business_Type,Name,Start_Date,Address,Latitude,Longitude,Parcel
1132,1132,1133,CONTRACTOR-ELECTRICAL,"DELTA TECHNOLOGIES, INC",01/10/2000 12:00:00 AM,"7010 NW 23RD WAY, SUITE B",29.718,-82.356516,6013004008
1816,1816,1817,MANUFACTURING NOT LISTED SEPARATELY,"AFRICAN FORMULA COSMETICS, INC",04/28/2015 12:00:00 AM,"7010 NW 23RD WAY, STE #A",29.718,-82.356516,6013004008


#### GRU Electricity consumption for each active business – Merge Active Businesse

In [67]:
electricity_cons_premisewise.head()

Unnamed: 0,CONTRACT,CONSUMPTION,UNIT,BILLINGPERIOD,BILLSTARTDATE,BILLENDDATE,BILLINGYEAR,BILLINGMONTH,INSTALL,CA,STARTDATE,ENDDATE,PREMISE,INSTALLTYPE,ZZCODE
0,4001746555,653,KWH,2017/02,20170128,20170224,2017,2,5000370000.0,200039280927,20160830,99991231,7000095215,FIT,
1,4001746555,1030,KWH,2017/03,20170225,20170329,2017,3,5000370000.0,200039280927,20160830,99991231,7000095215,FIT,
2,4001746555,943,KWH,2017/04,20170330,20170426,2017,4,5000370000.0,200039280927,20160830,99991231,7000095215,FIT,
3,4001746555,917,KWH,2017/05,20170427,20170526,2017,5,5000370000.0,200039280927,20160830,99991231,7000095215,FIT,
4,4001746555,839,KWH,2017/06,20170527,20170628,2017,6,5000370000.0,200039280927,20160830,99991231,7000095215,FIT,


In [56]:
elec_demo = electricity_cons_premisewise.merge(non_res_premises,how='inner',on='PREMISE')

In [68]:
elec_demo.head()["PARCEL"]

0    16241-003-000
1    16241-003-000
2    16241-003-000
3    16241-003-000
4    16241-003-000
Name: PARCEL, dtype: object

In [74]:
elec_demo['PARCEL'] = elec_demo['PARCEL'].apply(lambda x: x.replace('-','') if type(x) == str else x)

In [58]:
#elec_demo.set_index(['PARCEL','CONTRACT','INSTALL','BILLINGYEAR','BILLINGMONTH'])

In [87]:
elec_consuption_gnv = act_bus[['Name','Parcel']].dropna(subset=['Parcel']).merge(elec_demo[['PARCEL','CONSUMPTION','BILLINGYEAR']].dropna(subset=['PARCEL']), how='left', left_on='Parcel', right_on='PARCEL')#.set_index(['Parcel','BILLINGYEAR', 'BILLINGMONTH'])

In [155]:
exp = elec_consuption_gnv.dropna(subset=['Parcel','PARCEL']).sort_values(by=['Parcel','BILLINGYEAR'])

In [133]:
import locale
from locale import atof
locale.setlocale(locale.LC_NUMERIC, '')

'en_US.UTF-8'

In [157]:
def stringToFloat(x):
    if(type(x)==str):
        return atof(x)
    return x

In [158]:
exp['CONSUMPTION'] = exp['CONSUMPTION'].apply(stringToFloat)

In [162]:
elec_cons_parcel = exp[['Name','Parcel','BILLINGYEAR','CONSUMPTION']].groupby(['Name','Parcel','BILLINGYEAR'],as_index=False).mean()

In [164]:
writer = pd.ExcelWriter('ELectricity_consumption_with_parcelinfo.xlsx')
elec_cons_parcel.to_excel(writer, 'Sheet1')
writer.save()

** Disconnects at a given premise **

In [46]:
dunning_demo = dunning_disconnects.merge(business_partners, how='inner').merge(business_contracts).merge(business_intalls).merge(non_res_premises)

In [47]:
dunning_demo.set_index(['PARCEL','PREMISE','CA'])

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,BP,DISCNO,DISC_DATE,BP_TYPE,FIRST_NAME,LAST_NAME,INSTALL,CONTRACT,STARTDATE,ENDDATE,INSTALLTYPE,ZZCODE,SERVICEADDRESS,SCITY,SREGION,SPOST_CODE,SCOUNTRY,TAXJURCODE,PREMISETYPE
PARCEL,PREMISE,CA,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
09925001000,7000017189,200036591094,1000123638,810000265198,20120201,2,,PANFIN INC DBA LIBERTY TAX,5.00011e+09,4000794598,20100511,20120206,ELEC,,1105 N MAIN ST,GAINESVILLE,FL,32601,US,FLALA0004,COTHR
09925001000,7000017189,200043093734,1000168199,810000440944,20150804,1,MINATA,REDDICK,5.00011e+09,4001065977,20120329,20150806,ELEC,,1105 N MAIN ST,GAINESVILLE,FL,32601,US,FLALA0004,COTHR
08796000000,7000064629,200032665830,1000041016,810000130230,20090609,1,JEANNETTE,JOHNSON,5.00025e+09,4000628724,20090326,20110502,REFS,,1020 NW 30TH AVE,GAINESVILLE,FL,32609,US,FLALA0004,RSFD
08796000000,7000064629,200032665830,1000041016,810000130230,20090609,1,JEANNETTE,JOHNSON,5.00025e+09,4000628722,20090326,20110502,WATR,,1020 NW 30TH AVE,GAINESVILLE,FL,32609,US,FLALA0004,RSFD
08796000000,7000064629,200032665830,1000041016,810000130230,20090609,1,JEANNETTE,JOHNSON,5.00025e+09,4000628723,20090326,20110502,WSTU,,1020 NW 30TH AVE,GAINESVILLE,FL,32609,US,FLALA0004,RSFD
08796000000,7000064629,200032665830,1000041016,810000130230,20090609,1,JEANNETTE,JOHNSON,5.00025e+09,4000628659,20090326,20110502,ELEC,,1020 NW 30TH AVE,GAINESVILLE,FL,32609,US,FLALA0004,RSFD
08796000000,7000064629,200032665830,1000041016,810000130230,20090609,1,JEANNETTE,JOHNSON,5.00025e+09,4000628721,20090326,20110502,STRM,,1020 NW 30TH AVE,GAINESVILLE,FL,32609,US,FLALA0004,RSFD
08199046000,7000057079,200035281901,1000063661,810000258335,20111205,1,OTIS,NORWOOD,5.00031e+09,4000739703,20091026,99991231,ELEC,,2926 NE 20TH WAY STE 1,GAINESVILLE,FL,32609,US,FLALA0004,COTHR
08199046000,7000057079,200035281901,1000063661,810000276708,20120517,1,OTIS,NORWOOD,5.00031e+09,4000739703,20091026,99991231,ELEC,,2926 NE 20TH WAY STE 1,GAINESVILLE,FL,32609,US,FLALA0004,COTHR
08199046000,7000057079,200035281901,1000063661,810000268736,20120306,1,OTIS,NORWOOD,5.00031e+09,4000739703,20091026,99991231,ELEC,,2926 NE 20TH WAY STE 1,GAINESVILLE,FL,32609,US,FLALA0004,COTHR


In [50]:
act_bus.merge(dunning_demo, how='left', left_on='Parcel', right_on='PARCEL').set_index(['PREMISE','PARCEL'])

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 0,id,Business_Type,Name,Start_Date,Address,Latitude,Longitude,Parcel,BP,...,ENDDATE,INSTALLTYPE,ZZCODE,SERVICEADDRESS,SCITY,SREGION,SPOST_CODE,SCOUNTRY,TAXJURCODE,PREMISETYPE
PREMISE,PARCEL,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1
,,0,1,AUTO REPAIR GARAGE,"AUTOMOTIVE ELECTRIC SPECIALIST LLC, A",11/01/1991 12:00:00 AM,2948 NE 21ST WAY,29.6800,-82.295278,08199031000,,...,,,,,,,,,,
,,1,2,RETAIL MERCHANT,"ALL TYPE VACUUM CTR, INC",09/14/1995 12:00:00 AM,2225 NW 6TH ST,29.6737,-82.330548,09289000000,,...,,,,,,,,,,
,,2,3,STORAGE WAREHOUSE OR LOT,A-TURNER MVG. & STG. INC.,01/22/1996 12:00:00 AM,1001 NW 53RD AVE,29.7023,-82.335663,07966010004,,...,,,,,,,,,,
7.000072e+09,08199047000,3,4,REPAIRS NOT REQUIRING STATE LICENSE,"A-1 HANDYMAN, INC.",05/01/1978 12:00:00 AM,"3003 NE 19TH DR, STE. 8",29.6801,-82.297795,08199047000,1.000140e+09,...,99991231.0,ELEC,,3003 NE 19TH DR STE 2,GAINESVILLE,FL,32609,US,FLALA0004,COTHR
,,4,5,TRAVEL AGENCY,"AUTO CLUB GROUP INC, THE",09/27/1995 12:00:00 AM,1201 NW 13TH ST,29.6633,-82.338624,09536001000,,...,,,,,,,,,,
,,5,6,CONTRACTOR-HARV CLASS A UNLTD,"AAA REFRIGERATION, INC.",06/01/1991 12:00:00 AM,2908 NE 21ST WAY,29.6791,-82.295936,08199060000,,...,,,,,,,,,,
,,6,7,RETAIL MERCHANT,AAMAC CORP.,12/20/1995 12:00:00 AM,508 NW 8TH AVE,29.6598,-82.330261,09659000000,,...,,,,,,,,,,
,,7,8,RETAIL MERCHANT,"ABC LIQUORS, INC. #79",10/03/1995 12:00:00 AM,5820 NW 34TH BLVD,29.7095,-82.354680,07879005005,,...,,,,,,,,,,
,,8,9,BEAUTY PARLOR,ABOUT HAIR,01/22/1996 12:00:00 AM,4040 NEWBERRY RD,29.6548,-82.386334,,,...,,,,,,,,,,
,,9,10,RETAIL MERCHANT,ACE CASH EXPRESS #3254,01/29/1996 12:00:00 AM,806 WALDO RD,29.6597,-82.306893,,,...,,,,,,,,,,


### Change of contracts at given location – Change of businesses 

In [23]:
tempo1 = business_contracts.merge(business_intalls).merge(non_res_premises)#.set_index(['PREMISE','CA','CONTRACT'])

In [24]:
tempo1

Unnamed: 0,INSTALL,CONTRACT,CA,STARTDATE,ENDDATE,PREMISE,INSTALLTYPE,ZZCODE,SERVICEADDRESS,SCITY,SREGION,SPOST_CODE,SCOUNTRY,TAXJURCODE,PARCEL,PREMISETYPE
0,5.00006e+09,4000332116,200023567634,20070425,20070916,7000014285,ELEC,,1221 NE 28TH AVE,GAINESVILLE,FL,32609,US,FLALA0004,08230-004-015,RSFD
1,5.00025e+09,4000335421,200023695350,20070508,20090629,7000071867,ELEC,,3835 NW 8TH AVE,GAINESVILLE,FL,32605,US,FLALA0004,06487-014-006,RSFD
2,5.00025e+09,4000335424,200023695350,20070508,20090629,7000071867,WATR,,3835 NW 8TH AVE,GAINESVILLE,FL,32605,US,FLALA0004,06487-014-006,RSFD
3,5.00025e+09,4000335425,200023695350,20070508,20090629,7000071867,WSTU,,3835 NW 8TH AVE,GAINESVILLE,FL,32605,US,FLALA0004,06487-014-006,RSFD
4,5.00025e+09,4000335422,200023695350,20070508,20090629,7000071867,NTGS,,3835 NW 8TH AVE,GAINESVILLE,FL,32605,US,FLALA0004,06487-014-006,RSFD
5,5.00025e+09,4000335423,200023695350,20070508,20090629,7000071867,STRM,,3835 NW 8TH AVE,GAINESVILLE,FL,32605,US,FLALA0004,06487-014-006,RSFD
6,5.00025e+09,4000335426,200023695350,20070508,20090629,7000071867,REFS,,3835 NW 8TH AVE,GAINESVILLE,FL,32605,US,FLALA0004,06487-014-006,RSFD
7,5.00034e+09,4000345519,200023673728,20070529,20071211,7000101276,ELEC,,4444 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,,XTEMP
8,5.00034e+09,4000448934,200023673728,20071212,20080626,7000101276,ELEC,,4444 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,,XTEMP
9,5.00034e+09,4000348093,200023921985,20070601,20070827,7000097267,ELEC,,4537 NE 16TH TER,GAINESVILLE,FL,32609,US,FLALA0004,08160-010-023,XTEMP


In [25]:
tempo1[tempo1['INSTALLTYPE']=='ELEC'].merge(non_res_contract_acnts).set_index(['PREMISE','CA','CONTRACT'])

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,INSTALL,STARTDATE,ENDDATE,INSTALLTYPE,ZZCODE,SERVICEADDRESS,SCITY,SREGION,SPOST_CODE,SCOUNTRY,TAXJURCODE,PARCEL,PREMISETYPE,BP,CA_TYPE,MAILINGADDRESS,MCITY,MREGION,MPOST_CODE,MCOUNTRY
PREMISE,CA,CONTRACT,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1
7000014285,200023567634,4000332116,5.00006e+09,20070425,20070916,ELEC,,1221 NE 28TH AVE,GAINESVILLE,FL,32609,US,FLALA0004,08230-004-015,RSFD,1000039473,NR,2433 NW 71ST PL,GAINESVILLE,FL,32653-1625,US
7000071867,200023695350,4000335421,5.00025e+09,20070508,20090629,ELEC,,3835 NW 8TH AVE,GAINESVILLE,FL,32605,US,FLALA0004,06487-014-006,RSFD,1000092630,NR,211 W WARREN AVE,LONGWOOD,FL,32750-4108,US
7000101276,200023673728,4000345519,5.00034e+09,20070529,20071211,ELEC,,4444 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,,XTEMP,1000092491,NR,14785 OLD SAINT AUGUSTINE,JACKSONVILLE,FL,32258-2463,US
7000101276,200023673728,4000448934,5.00034e+09,20071212,20080626,ELEC,,4444 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,,XTEMP,1000092491,NR,14785 OLD SAINT AUGUSTINE,JACKSONVILLE,FL,32258-2463,US
7000097162,200023673728,4000479502,5.00034e+09,20080324,20080428,ELEC,,4444 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,06009-010-003,RSFD,1000092491,NR,14785 OLD SAINT AUGUSTINE,JACKSONVILLE,FL,32258-2463,US
7000101317,200023673728,4000448935,5.00035e+09,20071212,20080321,ELEC,,4444 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,06009-010-003,XTEMP,1000092491,NR,14785 OLD SAINT AUGUSTINE,JACKSONVILLE,FL,32258-2463,US
7000097267,200023921985,4000348093,5.00034e+09,20070601,20070827,ELEC,,4537 NE 16TH TER,GAINESVILLE,FL,32609,US,FLALA0004,08160-010-023,XTEMP,1000006014,NR,4118 NW 69TH ST,GAINESVILLE,FL,32606-4212,US
7000093191,200024148220,4000350533,5.00009e+09,20070608,20070712,ELEC,,2933 SW 35TH PL APT 120,GAINESVILLE,FL,32608,US,FLALA0004,07297-022-020,RMFLRG,1000032805,NR,1325 NW 53RD AVE STE D,GAINESVILLE,FL,32609-6139,US
7000042306,200014123167,4000352707,5.00034e+09,20070609,20080514,ELEC,,4456 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,06009-010-004,RSFD,1000009221,NR,301 KINGSLEY LAKE DR STE 504,ST AUGUSTINE,FL,32092-3040,US
7000097257,200014123167,4000139228,5.00014e+09,20070407,20080514,ELEC,,4456 NW 82ND RD,GAINESVILLE,FL,32653,US,FLALA0004,,XTEMP,1000009221,NR,301 KINGSLEY LAKE DR STE 504,ST AUGUSTINE,FL,32092-3040,US


** Business Premises not in active businesses **

In [26]:
act_bus = pd.read_csv('../Active_Businesses_with_parcel.csv')

In [27]:
non_res_premises['PARCEL'] = non_res_premises['PARCEL'].apply(lambda x: str(x).replace('-',''))

In [28]:
non_res_premises[non_res_premises['PARCEL'].isin(act_bus['Parcel'])].count()

PREMISE           3367
SERVICEADDRESS    3367
SCITY             3367
SREGION           3367
SPOST_CODE        3367
SCOUNTRY          3367
TAXJURCODE        3367
PARCEL            3367
PREMISETYPE       3338
dtype: int64

In [29]:
# Trying to find installs for a particular premise with address '2930 SW 23RD TER'

business_intalls[business_intalls['PREMISE']==7000124123]    # -- Here Premise number is 7000124123
business_contracts[business_contracts['INSTALL']==5000376194] # For above premise here install no is 5000376194

Unnamed: 0,INSTALL,CONTRACT,CA,STARTDATE,ENDDATE
1210079,5000376000.0,4001305074,200048721249,20131010,99991231


In [30]:
# Trying to find installs for a particular premise with address '2930 SW 23RD TER'

business_intalls[business_intalls['PREMISE']==7000124124] # -- Here Premise number is 7000124124
business_contracts[business_contracts['INSTALL']==5000376195] # For above premise here install no is 5000376195

Unnamed: 0,INSTALL,CONTRACT,CA,STARTDATE,ENDDATE
1210083,5000376000.0,4001305263,200048721350,20131010,99991231


In [None]:
# non_res_contract_acnts[non_res_contract_acnts['CA']==200048721249]

# non_res_contract_acnts[non_res_contract_acnts['CA']==200048904438]

In [101]:
non_res_premises[non_res_premises['SERVICEADDRESS'] == '2930 SW 23RD TER ']

Unnamed: 0,PREMISE,SERVICEADDRESS,SCITY,SREGION,SPOST_CODE,SCOUNTRY,TAXJURCODE,PARCEL,PREMISETYPE
94845,7000124123,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
94846,7000124124,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
96495,7000123951,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
96547,7000124221,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
96548,7000124222,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
96549,7000124223,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
96553,7000124229,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
96555,7000124300,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD
96556,7000124301,2930 SW 23RD TER,GAINESVILLE,FL,32608,US,FLALA0004,07314-000-000,CNOBLD


In [179]:
business_dunning_disconnects = dunning_disconnects[dunning_disconnects['CA'].isin(business_contracts['CA'])]

In [182]:
business_dunning_disconnects

Unnamed: 0,BP,CA,DISCNO,DISC_DATE
0,1000123638,200036591094,810000265198,20120201
433,1000051933,200012249956,810000068502,20080430
437,1000003144,200012433650,810000072872,20080530
810,1000012073,200044023520,810000300765,20121101
1426,1000037374,200019577702,810000044622,20071108
1514,1000088290,200011903786,810000066818,20080421
1672,1000009822,200031182942,810000122057,20090409
2086,1000124006,200035463066,810000215458,20110111
2415,1000104773,200027089643,810000175895,20100419
2454,1000009612,200014616655,810000224736,20110330


In [186]:
business_contracts[business_contracts['CA'] == 200044023520]

Unnamed: 0,INSTALL,CONTRACT,CA,STARTDATE,ENDDATE
1284272,5000055000.0,4001105785,200044023520,20120711,20130807
1290450,5000055000.0,4001105786,200044023520,20120711,20130807
1295576,5000055000.0,4001105787,200044023520,20120711,20130807


In [188]:
business_contracts[business_contracts['CA'] == 200044023520]['INSTALL'][1284272]

5000055299.0

In [189]:
business_intalls[business_intalls['INSTALL'] == 5000055299]

Unnamed: 0,INSTALL,PREMISE,INSTALLTYPE,ZZCODE
332939,5000055299,7000057245,ELEC,


In [190]:
business_intalls[business_intalls['PREMISE']==7000057245]

Unnamed: 0,INSTALL,PREMISE,INSTALLTYPE,ZZCODE
313438,5000055320,7000057245,WSTU,
318542,5000055313,7000057245,WATR,
319651,5000060108,7000057245,IRRW,
332939,5000055299,7000057245,ELEC,


In [185]:
non_res_contract_acnts[non_res_contract_acnts['CA'] == 200012433650]

Unnamed: 0,CA,BP,CA_TYPE,MAILINGADDRESS,MCITY,MREGION,MPOST_CODE,MCOUNTRY
204398,200012433650,1000003144,NR,501 SE 18TH ST OFC,GAINESVILLE,FL,32641-7455,US


In [159]:
ins[464490]
ab = int(ins[464490])
ab

5000363121

In [162]:
business_intalls[business_intalls['INSTALL'] == ab]

Unnamed: 0,INSTALL,PREMISE,INSTALLTYPE,ZZCODE
372246,5000363121,7000111811,GRUC,


In [128]:
unique_premises = business_intalls['PREMISE'].unique()