In [31]:
import pandas as pd
import geopandas as gpd
from shapely import Point
from math import radians, cos, sin, asin, sqrt
import dask.dataframe as dd

In [32]:
# radius that is used as a limit of distance between two sets of coordinates
RADIUS_KM = 0.3048

## Functions & File Load In

In [33]:
# function to calculuate distance between 2 sets of coordinates

def haversine(lon1, lat1, lon2, lat2):
    """
    Calculate the great circle distance in kilometers between two points 
    on the earth (specified in decimal degrees)
    """
    # convert decimal degrees to radians 
    lon1, lat1, lon2, lat2 = map(radians, [lon1, lat1, lon2, lat2])

    # haversine formula 
    dlon = lon2 - lon1 
    dlat = lat2 - lat1 
    a = sin(dlat/2)**2 + cos(lat1) * cos(lat2) * sin(dlon/2)**2
    c = 2 * asin(sqrt(a)) 
    r = 6371 # Radius of earth in kilometers. Use 3956 for miles. Determines return value units.
    # print("Distance:", c * r)
    return c * r

In [34]:
"""
funtion will take 4 inputs. infogroup_df & counterglow_df2 are the dataframes being analyzed.
the third input is the specific state that we are choosing to analyze
the fourth input is the threshold distance. this distance is the max allowable distance between 2
datapoints. the output is a dataframe that in each row, we have a datapoint that represents a
datapoint from infogroup and (x distance away) a farm spotted in the counterglow data. we are
speculating that it is possible for a spotted farm in counterglow to not have the most precise address
and actually exist in the Infogroup data, but with slightly different longitude and latitude
"""

def potential_farms(infogroup_df, counterglow_df, two_letter_state, max_dist_km ):
    
    # ruduce dataframe to only consist rows with specified two_letter_state
    infogroup_state_df      = infogroup_df[infogroup_df["STATE"] == two_letter_state]
    counterglow_state_df    = counterglow_df[counterglow_df["State"] == two_letter_state]
    
    # create two new empty dataframe that we will be adding to when match is found
    infogroup_trim     = pd.DataFrame(columns=infogroup_state_df.columns)
    counterglow_trim   = pd.DataFrame(columns=counterglow_state_df.columns)
    
    counter = 0 # to counter matches, can print to terminal if desired
    for i in range(len(infogroup_state_df)):
        
        infogroup_longitude  = infogroup_state_df.iloc[i]["LONGITUDE"]  # get longitude
        infogroup_latitude   = infogroup_state_df.iloc[i]["LATITUDE"]   # get latitude
        
        for j in range(len(counterglow_state_df)):
            
            counterglow_latitude    = counterglow_state_df.iloc[j]["Lat"]    # get latitude
            counterglow_longitude   = counterglow_state_df.iloc[j]["Lat.1"]  # get longitude
            
            dist_km                 = haversine(infogroup_longitude, infogroup_latitude, 
                                                counterglow_longitude, counterglow_latitude)
            
            if(dist_km <= max_dist_km): # if the distance is <= the max distance set in function
                counter += 1
            
                infogroup_trim.loc[len(infogroup_trim.index)]      = infogroup_state_df.iloc[i]
                counterglow_trim.loc[len(counterglow_trim.index)]  = counterglow_state_df.iloc[j]
        
    # change the name of the columns for Latitude & Longitude in each dataframe
    # for Infogroup Dataframe
    infogroup_trim      = infogroup_trim.rename(columns={'LATITUDE': 'LATITUDE 1', 
                                                        'LONGITUDE': 'LONGITUDE 1'})
    counterglow_trim    = counterglow_trim.rename(columns={'Lat' : 'LATITUDE 2',
                                                           'Lat.1': 'LONGITUDE 2'})
    
    # print to terminal to let user know there were matches found
    if(counter !=0):
        print(two_letter_state + ":", "Total number of matches:", counter)
                
    return infogroup_trim, counterglow_trim   
    

In [35]:
"""
function take a dataframe and a list of states. This function calls the function 'potential_farms'
if the two dataframes returned from 'potential_farms' are NOT empty, they are added to the dictionaries
the keys for the dictionaries are the STATE in the current iteration (in the for loop) and the values
are the dataframes associated with the state. This function will return two dictionaries

This function POTENTIAL_FARMS function
"""

def infogroup_counterglow_dict(sic_df, counterglow_df, list_of_states, radium_km):
    # empty dictionaries
    igroup_sic_dict = {}
    ctrglow_dict = {}

    # loop through states list and use those as keys to match with the dataframe that was output 
    for state in range(len(list_of_states)):
        infogroup_matches, counterglow_matches = potential_farms(sic_df, counterglow_df, list_of_states[state], radium_km)
        
        # set up key value pairing for both dictionaries
        # only adding to dictionaries if there are matches
        if( (len(infogroup_matches)!=0) & (len(counterglow_matches)!=0) ):
            igroup_sic_dict[list_of_states[state]]    = infogroup_matches
            ctrglow_dict[list_of_states[state]]       = counterglow_matches
            
    return igroup_sic_dict, ctrglow_dict


In [36]:
"""
fucntion will take a dataframe and trim off all columns, only leaving:
Company, address line 1, city, state, zipcode, primary sic code, sic code 1, sic code 2, sic code 3, sic code 4,
"""

def keep_certain_columns(dict):
    for key in dict:
        dict[key] = dict[key][['COMPANY', 'ADDRESS LINE 1', 'CITY', 'STATE', 'ZIPCODE', 'PRIMARY SIC CODE', 'SIC6_DESCRIPTIONS',
                'PRIMARY NAICS CODE', 'NAICS8 DESCRIPTIONS', 'SIC CODE', 'SIC6_DESCRIPTIONS (SIC)',
                'SIC CODE 1', 'SIC6_DESCRIPTIONS (SIC1)', 'SIC CODE 2', 'SIC6_DESCRIPTIONS(SIC2)',
                'SIC CODE 3', 'SIC6_DESCRIPTIONS(SIC3)', 'SIC CODE 4', 'SIC6_DESCRIPTIONS(SIC4)', 'PARENT NUMBER']]
    
    return dict


In [37]:
# function that take a dictionary, the keys are STATES (2 letter) and the VALUES are a dataframe
# containing the locations that are close to a counterglow location

def list_of_dataframes(infogroup_dict, master_list):
    
    # loop through each key in the dictinary (each state in this case)
    for key in infogroup_dict.keys():
        # drop the duplicate rows and then add the trimmed dataframe to master_list
        master_list.append(infogroup_dict[key].drop_duplicates())
        
    return master_list

In [38]:
# load counterglow dataset
df_counterglow = pd.read_csv("../data/Counterglow+Facility+List+Complete.csv")

In [39]:
# filter counterglow dataset to have poultry/chicken only

# Chickens & Other Birds (Meat)
# Chickens (Meat)

df_counterglow_poultry = df_counterglow[(df_counterglow['Farm Type'] == 'Chickens & Other Birds (Meat)') |
                                        (df_counterglow['Farm Type'] == 'Chickens (Meat)')]


In [40]:
states = ['IA', 'OK', 'MO', 'OK', 'AL', 'LA', 'MS', 'IL', 'IN', 'OH', 'KY', 'TN', 'AR', 'NC', 'SC', 'GA']

In [41]:
all_df_list = []

## SIC Code 0291 Exploration: General Farms, Primarily Livestock and Animal Specialties.

In [42]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 0291
df_sic_0291 = pd.read_csv("../data/code_0291.csv")
  
igroup_sic_0291_dict, ctrglow_0291_dict = infogroup_counterglow_dict(df_sic_0291, df_counterglow_poultry, states, RADIUS_KM)


NC: Total number of matches: 1


In [11]:
# igroup_sic_0291_dict = keep_certain_columns(igroup_sic_0291_dict)

In [43]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_0291_dict, all_df_list)

In [44]:
len(all_df_list)

1

#### Explore

In [None]:
igroup_sic_0291_dict['AL']

In [46]:
igroup_sic_0291_dict['NC']

Unnamed: 0.1,Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,ZIP4,COUNTY CODE,AREA CODE,IDCODE,...,POPULATION CODE,CENSUS TRACT,CENSUS BLOCK,LATITUDE 1,LONGITUDE 1,MATCH CODE,CBSA CODE,CBSA LEVEL,CSA CODE,FIPS CODE
0,11864,LATTAS EGG RANCH INC,1016 GOVERNOR BURKE RD,HILLSBOROUGH,NC,27278,8631.0,135,919,2,...,7,10901.0,1.0,36.103037,-79.086815,P,20500,2.0,450,37135


## SIC Code 0241 Exploration: Dairy Farms

In [48]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 0241
df_sic_0241 = pd.read_csv("../data/code_0241.csv")
  
igroup_sic_0241_dict, ctrglow_0241_dict = infogroup_counterglow_dict(df_sic_0241, df_counterglow_poultry, states, RADIUS_KM)


OH: Total number of matches: 1
NC: Total number of matches: 1


In [15]:
# igroup_sic_0241_dict = keep_certain_columns(igroup_sic_0241_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_0241_dict, all_df_list)

#### Explore

In [16]:
igroup_sic_0241_dict['IN']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,THOMAS BONTRAGER FARM,63666 COUNTY ROAD 37,GOSHEN,IN,46528,19198,GENERAL FARMS-PRIMARILY CROP,11199807.0,ALL OTHER MISCELLANEOUS CROP FARMING,24103.0,DAIRY FARMS,,,,,,,,,


In [17]:
igroup_sic_0241_dict['OH']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,R F & SONS,5629 STATE ROUTE 49,FORT RECOVERY,OH,45846,24103,DAIRY FARMS,11212002.0,DAIRY CATTLE & MILK PRODUCTION,,,,,,,,,,,


In [18]:
igroup_sic_0241_dict['NC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,FOGLEMAN DAIRY,9144 SYLVAN RD,LIBERTY,NC,27298,24103,DAIRY FARMS,11212002.0,DAIRY CATTLE & MILK PRODUCTION,24101.0,DAIRIES (MILK),,,,,,,,,


## SIC Code 0761 Exploration: Farm Labor

In [12]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 0761
df_sic_0761 = pd.read_csv("../data/code_0761.csv")
  
igroup_sic_0761_dict, ctrglow_0761_dict = infogroup_counterglow_dict(df_sic_0761, df_counterglow_poultry, states, RADIUS_KM)


In [77]:
# igroup_sic_0761_dict = keep_certain_columns(igroup_sic_0761_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_0761_dict, all_df_list)

#### Explore

## SIC Code 0762 Exploration: Farm Mgmt Services

In [13]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 0762
df_sic_0762 = pd.read_csv("../data/code_0762.csv")
  
igroup_sic_0762_dict, ctrglow_0762_dict = infogroup_counterglow_dict(df_sic_0762, df_counterglow_poultry, states, RADIUS_KM)


MS: Total number of matches: 1


In [21]:
# igroup_sic_0762_dict = keep_certain_columns(igroup_sic_0762_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_0762_dict, all_df_list)

#### Explore

In [22]:
igroup_sic_0762_dict['MS']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,DAVID SHARP FARM,357 ROBERT BUTLER RD,FOREST,MS,39074,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,76203.0,FARMING SERVICE,,,,,,,,,


In [23]:
igroup_sic_0762_dict['OH']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,SUNRISE CO-OP,5458 STATE ROUTE 49,FORT RECOVERY,OH,45846,519111,FEED-WHOLESALE,42491013.0,FARM SUPPLIES MERCHANT WHOLESALERS,76203.0,FARMING SERVICE,519112.0,FEED-DEALERS (WHLS),,,,,,,5503818.0


## SIC Code 8748 Exploration: Farm Mgmt Systems

In [14]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 8748
df_sic_8748 = pd.read_csv("../data/code_8748.csv")
  
igroup_sic_8748_dict, ctrglow_8748_dict = infogroup_counterglow_dict(df_sic_8748, df_counterglow_poultry, states, RADIUS_KM)


In [25]:
# igroup_sic_8748_dict = keep_certain_columns(igroup_sic_8748_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_8748_dict, all_df_list)

#### Explore

In [26]:
igroup_sic_8748_dict['IA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,HARBOR GROUP INC,444 12TH ST NE,SIOUX CENTER,IA,51250.0,874899,CONSULTANTS-BUSINESS NEC,54161830.0,OTHER MANAGEMENT CONSULTING SERVICES,874201.0,BUSINESS MANAGEMENT CONSULTANTS,,,,,,,,,


In [27]:
igroup_sic_8748_dict['MO']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,SOUTHWEST AVIATION & MFG LLC,164 ROUTE J,SOUTH WEST CITY,MO,64863.0,559905,AIRCRAFT-DEALERS,44122815.0,"MOTORCYCLE, ATV & ALL OTHER MOTOR VEHICLE DEALERS",874822.0,AVIATION CONSULTANTS,,,,,,,,,


In [28]:
igroup_sic_8748_dict['AL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,WALMART TECH SVC,1450 N BRINDLEE MOUNTAIN PKWY,ARAB,AL,35016.0,874813,SECURITY SYSTEMS CONSULTANTS,54161813.0,OTHER MANAGEMENT CONSULTING SERVICES,599902.0,CELLULAR TELEPHONES-EQUIPMENT & SUPLS,737904.0,COMPUTERS-NETWORKING,,,,,,,
1,JACKSON ROOFING & REMOLDLING,3324 HIDDEN BROOK CIRCLE,HEADLAND,AL,36345.0,874899,CONSULTANTS-BUSINESS NEC,54161830.0,OTHER MANAGEMENT CONSULTING SERVICES,176111.0,SIDING CONTRACTORS,176109.0,ROOFING CONTRACTORS,,,,,,,
2,SANDERS AVIATION INC,20 ELLIS HAYNES DR,JASPER,AL,35503.0,874822,AVIATION CONSULTANTS,54169074.0,OTHER SCIENTIFIC & TECHNICAL CONSULTING SERVICES,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,


In [29]:
igroup_sic_8748_dict['MS']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,SOUTHERN INDUSTRIAL TECH,25 COUNTY ROAD 17,STRINGER,MS,39481.0,874836,INDUSTRIAL CONSULTANTS,54132012.0,LANDSCAPE ARCHITECTURAL SERVICES,,,,,,,,,,,
1,FURR & ASSOC,1040 BELT LINE DR NE,BROOKHAVEN,MS,39601.0,874823,COMMUNICATIONS CONSULTANTS,54161814.0,OTHER MANAGEMENT CONSULTING SERVICES,,,,,,,,,,,
2,BEEHIVE HOMES OF PHILADELPHIA,708 COLUMBUS AVE,PHILADELPHIA,MS,39350.0,836105,RESIDENTIAL CARE HOMES,62331206.0,ASSISTED LIVING FACILITIES FOR THE ELDERLY,874859.0,ASSISTED LIVING FACILITY CONSULTANTS,,,,,,,,,


In [30]:
igroup_sic_8748_dict['IL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,WAGNER CONSULTING-AGRICULTURE,709 OAK ST,LENA,IL,61048.0,874899,CONSULTANTS-BUSINESS NEC,54161830.0,OTHER MANAGEMENT CONSULTING SERVICES,,,,,,,,,,,


In [31]:
igroup_sic_8748_dict['IN']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,DAVITA VINCENNES HOME DIALYSIS,700 WILLOW ST # 102,VINCENNES,IN,47591.0,809203,DIALYSIS,62149202.0,KIDNEY DIALYSIS CENTERS,874802.0,TRAINING CONSULTANTS,829931.0,TRAINING PROGRAMS & SERVICES,801104.0,CLINICS,808201.0,HOME HEALTH SERVICE,,,886835255.0


In [32]:
igroup_sic_8748_dict['AR']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,MORELIA MEXICAN REATSURANT,304 W SUNSET AVE,SPRINGDALE,AR,72764.0,874831,FOOD FACILITIES-CONSULTANTS,54161821.0,OTHER MANAGEMENT CONSULTING SERVICES,581208.0,RESTAURANTS,,,,,,,,,


In [33]:
igroup_sic_8748_dict['NC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,BLUE RIDGE HOME CONSLNTS INC,144 MARSHALL RD,NEBO,NC,28761.0,874899,CONSULTANTS-BUSINESS NEC,54161830.0,OTHER MANAGEMENT CONSULTING SERVICES,,,,,,,,,,,
1,MULTI COMMUNICATIONS INC,19 COVERT RD,OLD FORT,NC,28762.0,489903,COMMUNICATIONS,51791901.0,ALL OTHER TELECOMMUNICATIONS,874823.0,COMMUNICATIONS CONSULTANTS,,,,,,,,,


## SIC Code 5431 Exploration: Farm Markets

In [15]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 5431
df_sic_5431 = pd.read_csv("../data/code_5431.csv")
  
igroup_sic_5431_dict, ctrglow_5431_dict = infogroup_counterglow_dict(df_sic_5431, df_counterglow_poultry, states, RADIUS_KM)


IA: Total number of matches: 1


In [35]:
# igroup_sic_5431_dict = keep_certain_columns(igroup_sic_5431_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_5431_dict, all_df_list)

#### Exploration

In [36]:
igroup_sic_5431_dict['IA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,FARMERS FRESH POULTRY,5195 FARMERS AVE SW,KALONA,IA,52247,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,543102.0,FARM MARKETS,,,,,,,,,
1,FLINT RIDGE ORGANIC PRODUCE,1896 110TH ST,KALONA,IA,52247,543101,FRUITS & VEGETABLES & PRODUCE-RETAIL,44523003.0,FRUIT & VEGETABLE MARKETS,,,,,,,,,,,


In [37]:
igroup_sic_5431_dict['AR']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,DEL,1229 W SUNSET AVE,SPRINGDALE,AR,72764,543101,FRUITS & VEGETABLES & PRODUCE-RETAIL,44523003.0,FRUIT & VEGETABLE MARKETS,,,,,,,,,,,
1,DEL REY PRODUCE,1229 W SUNSET AVE,SPRINGDALE,AR,72764,543101,FRUITS & VEGETABLES & PRODUCE-RETAIL,44523003.0,FRUIT & VEGETABLE MARKETS,514803.0,PRODUCE-BROKERS (WHLS),,,,,,,,,


In [38]:
igroup_sic_5431_dict['NC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,TRADING POST,4500 US HIGHWAY 64 90 W,TAYLORSVILLE,NC,28681,543101,FRUITS & VEGETABLES & PRODUCE-RETAIL,44523003.0,FRUIT & VEGETABLE MARKETS,,,,,,,,,,,


## SIC Code 8611 Exploration: Farm Organizations

In [16]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 8611
df_sic_8611 = pd.read_csv("../data/code_8611.csv")
  
igroup_sic_8611_dict, ctrglow_8611_dict = infogroup_counterglow_dict(df_sic_8611, df_counterglow_poultry, states, RADIUS_KM)


IL: Total number of matches: 1


In [40]:
# igroup_sic_8611_dict = keep_certain_columns(igroup_sic_8611_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_8611_dict, all_df_list)

#### Exploration

In [41]:
igroup_sic_8611_dict['MS']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,FREENY WATER ASSN,1411 HIGHWAY 35 S,CARTHAGE,MS,39051,861102,ASSOCIATIONS,81391002.0,BUSINESS ASSOCIATIONS,,,,,,,,,,,


In [42]:
igroup_sic_8611_dict['IL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,AMERICAN LEGION HOME,316 W MAIN ST,LENA,IL,61048,864102,VETERANS' & MILITARY ORGANIZATIONS,81341003.0,CIVIL & SOCIAL ORGANIZATIONS,861102.0,ASSOCIATIONS,,,,,,,,,496227620.0


In [43]:
igroup_sic_8611_dict['AR']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,NORTHWEST ARK HM BLDRS ASSN,2022 LONG ST,SPRINGDALE,AR,72764,861102,ASSOCIATIONS,81391002.0,BUSINESS ASSOCIATIONS,,,,,,,,,,,
1,SPRINGDALE CHAMBER OF COMMERCE,1200 S THOMPSON ST,SPRINGDALE,AR,72764,861104,CHAMBERS OF COMMERCE,81391005.0,BUSINESS ASSOCIATIONS,,,,,,,,,,,


In [44]:
igroup_sic_8611_dict['NC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,QUEEN'S CUP STEEPLECHASE,6103 WAXHAW HWY,MINERAL SPRINGS,NC,28108,861102,ASSOCIATIONS,81391002.0,BUSINESS ASSOCIATIONS,,,,,,,,,,,


## SIC Code 0723 Exploration: Farm Produce

In [17]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 0723
df_sic_0723 = pd.read_csv("../data/code_0723.csv")
  
igroup_sic_0723_dict, ctrglow_0723_dict = infogroup_counterglow_dict(df_sic_0723, df_counterglow_poultry, states, RADIUS_KM)


In [47]:
# igroup_sic_0723_dict = keep_certain_columns(igroup_sic_0723_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_0723_dict, all_df_list)

#### Explore

## SIC Code 0191 Exploration: Farm Products

In [None]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 0191
df_sic_0191 = pd.read_csv("../data/code_0191.csv")
  
igroup_sic_0191_dict, ctrglow_0191_dict = infogroup_counterglow_dict(df_sic_0191, df_counterglow_poultry, states, RADIUS_KM)


In [50]:
# igroup_sic_0191_dict = keep_certain_columns(igroup_sic_0191_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_0191_dict, all_df_list)

#### Explore

In [51]:
igroup_sic_0191_dict['IA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,KDD INC,4755 20TH ST,GRINNELL,IA,50112,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,
1,CENTRUM VALLEY FARMS,2975 WASHINGTON AVE,DOWS,IA,50071,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
2,CENTURN VALLEY FARMS,2688 270TH ST,GALT,IA,50101,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
3,CENTRUM VALLEY FARMS,2674 HIGHWAY 69,GALT,IA,50101,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),541105.0,GROCERS-RETAIL,,,,,,,
4,DAVID HOAKISON FARMS,1089 JOSHUA AVE,CRESTON,IA,50801,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
5,FORSMAN FARMS,2975 265TH ST,VILLISCA,IA,50864,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
6,DE COSTER FARMS OF IOWA,1795 DOGWOOD AVE,ALEXANDER,IA,50420,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
7,SIOUX COUNTY EGG FARM LLP,2716 380TH ST,SIOUX CENTER,IA,51250,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,514404.0,POULTRY-WHOLESALE,,,,,,,,,
8,MERLIN DE GROOT FARM,4702 360TH ST,SHELDON,IA,51201,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
9,BROWN FARMS,2810 480TH AVE,GRAETTINGER,IA,51342,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,


In [53]:
igroup_sic_0191_dict['MO']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,JOHNSON COUNTY EGG FARM,1275 SE Y HWY,KNOB NOSTER,MO,65336,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),,,,,,,,,
1,JOHNSON COUNTY EGG FARM,1285 SE Y HWY,KNOB NOSTER,MO,65336,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),549914.0,EGGS-RETAIL,,,,,,,
2,DANNY MAZELIN FARM,33403 ALMOND RD,COLE CAMP,MO,65325,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
3,RIVERAS FARMS LLC,1316 FARM ROAD 2155,EXETER,MO,65647,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,
4,MOARK PRODUCTION INC,19242 MALLARD DR,NEOSHO,MO,64850,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),549914.0,EGGS-RETAIL,,,,,,,
5,GM FARMS,17684 WALLEYE RD,FAIRVIEW,MO,64842,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
6,ARNAUD VICTOR FARMS,7457 FARM ROAD 2040,MONETT,MO,65708,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
7,DOCMO FARM,9988 COUNTY ROAD 488,DUDLEY,MO,63936,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,
8,DICK MCKUIN FARMS,2320 STATE HIGHWAY 25,BERNIE,MO,63822,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,


In [54]:
igroup_sic_0191_dict['AL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,NUNLEY FARMS LLC,12527 HIGHWAY 23,VINA,AL,35593,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
1,WENDELL GIBBS FARMS,2118 COUNTY ROAD 23,RANBURNE,AL,36273,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
2,C J FARMS,486 COUNTY ROAD 95,RANBURNE,AL,36273,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
3,C J FARMS,486 COUNTY ROAD 95,RANBURNE,AL,36273,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
4,GRANBERRY FARM,5955 COUNTY ROAD 55,COLUMBIA,AL,36319,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
5,BAILEY FARMS,3536 SARDIS RD,ASHLAND,AL,36251,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,
6,GIBBS FARMS,1358 COUNTY ROAD 68,RANBURNE,AL,36273,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
7,SOUTH HENRY PEANUTS INC,,HEADLAND,AL,36345,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
8,HUGULEY FARMS INC,5405 N COUNTY ROAD 65,COFFEE SPRINGS,AL,36318,78203,SOD & SODDING SERVICE,56173019.0,LANDSCAPING SERVICES,19101.0,FARMS,,,,,,,,,
9,TRIPLE O FARMS LLC,643 GILBERT RD,LOWNDESBORO,AL,36752,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,


In [56]:
igroup_sic_0191_dict['MS']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,TCL POULTRY FARM,83 COURTNEY LN,BASSFIELD,MS,39421,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
1,ROWLEY FARMS INC,313 ROWLEY RD,FOXWORTH,MS,39483,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,
2,B B FARMS,667 LOWER BROOKHAVEN RD,MONTICELLO,MS,39654,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
3,MARTIN FARMS LLC,12302 HIGHWAY 98,SMITHDALE,MS,39664,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
4,HOMOCHITTO POULTRY FARM,3118 CASEYVILLE RD NW,WESSON,MS,39191,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
5,M & N FARMS,2868 SHILOH RD # A,PELAHATCHIE,MS,39145,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
6,ALYSSA FARM LLC,1140 LAWRENCE CONEHATTA RD,LAWRENCE,MS,39336,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
7,GREAT SOUTHERN FARMS LLC,1729 HIGHWAY 15,RICHTON,MS,39476,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
8,STUBBS FARMS,129 MILITARY RD,SUMRALL,MS,39482,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
9,J & D'S FARMS,964 TOWNSEND DR SE,BROOKHAVEN,MS,39601,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,


In [57]:
igroup_sic_0191_dict['IL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,HI-GRADE EGG,317 E 360 NORTH RD # 2,LODA,IL,60948,201501,POULTRY PROCESSING PLANTS (MFRS),31161501.0,POULTRY PROCESSING,19101.0,FARMS,,,,,,,,,


In [58]:
igroup_sic_0191_dict['IN']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,ISCH FARMS INC,1977 S 400 W-1,BLUFFTON,IN,46714,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
1,S & G POULTRY FARM,2496 S 400 W,MONROE,IN,46772,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,
2,J & K TURKEY FARM LLC,4329 E 225 S,WASHINGTON,IN,47501,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
3,PERDUE FARMS INC,500 PERDUE RD,VINCENNES,IN,47591,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,201501.0,POULTRY PROCESSING PLANTS (MFRS),25401.0,POULTRY FARMS,,,,,,,7529217.0
4,ROSE ACRE FARMS INC,5438 W STATE ROAD 16,RENSSELAER,IN,47978,25298,CHICKEN EGGS,11231001.0,CHICKEN EGG PRODUCTION,19101.0,FARMS,,,,,,,,,1081025.0
5,THOMAS BONTRAGER FARM,63666 COUNTY ROAD 37,GOSHEN,IN,46528,19198,GENERAL FARMS-PRIMARILY CROP,11199807.0,ALL OTHER MISCELLANEOUS CROP FARMING,24103.0,DAIRY FARMS,,,,,,,,,
6,JONES FARMS,12210 N BRADFORD RD NE,PALMYRA,IN,47164,19198,GENERAL FARMS-PRIMARILY CROP,11199807.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
7,MIDWEST PULLET FARMS,4854 S 1000 W,MENTONE,IN,46539,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
8,MID RIVER FARMS,10335 COUNTY ROAD 18,MIDDLEBURY,IN,46540,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,
9,BROVONT SOW FARM INC,2322 W STATE ROAD 14,SILVER LAKE,IN,46982,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,


In [59]:
igroup_sic_0191_dict['OH']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,HERTZFELD POULTRY FARMS,15799 MILTON RD,GRAND RAPIDS,OH,43522,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,
1,HOMAN FARMS,6671 ASHMAN RD,MARIA STEIN,OH,45860,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,13901.0,AGRICULTURAL PRODUCTS,,,,,,,,,


In [61]:
igroup_sic_0191_dict['TN']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,SUNSET RIDGE CATTLE CO,400 BRODIO RD,DEER LODGE,TN,37726,75102,LIVESTOCK BREEDERS,11521010.0,SUPPORT ACTIVITIES FOR ANIMAL PRODUCTION,19101.0,FARMS,,,,,,,,,


In [62]:
igroup_sic_0191_dict['AR']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,U-PICK IT FARM & GARDEN CORP,17369 WYOLA RD,WINSLOW,AR,72959,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,


In [64]:
igroup_sic_0191_dict['NC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,LEONARD LAKES FARMS,329 LEONARD RD,LINCOLNTON,NC,28092,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
1,CONYERS' FARMS,8520 COLLIERS CHAPEL CHURCH RD,LINDEN,NC,28356,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
2,WHITESIDES FARM & RENTAL LLC,3287 JUNE BUG RD,VALE,NC,28168,19198,GENERAL FARMS-PRIMARILY CROP,11199807.0,ALL OTHER MISCELLANEOUS CROP FARMING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,
3,ROCK CREEK FARM,7014 MOUNT HERMON ROCK CRK RD,SNOW CAMP,NC,27349,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
4,ROCK CREEK FARM,7014 MOUNT HERMON ROCK CRK RD,SNOW CAMP,NC,27349,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
5,MITCHELL FARMS,4167 CHURCH RD,TAYLORSVILLE,NC,28681,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
6,MITCHELL FARMS,4167 CHURCH RD,TAYLORSVILLE,NC,28681,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
7,MITCHELL FARMS,4167 CHURCH RD,TAYLORSVILLE,NC,28681,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
8,MITCHELL FARMS,4167 CHURCH RD,TAYLORSVILLE,NC,28681,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
9,FARM GRAND C,298 R AND R LN,TAYLORSVILLE,NC,28681,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,


In [65]:
igroup_sic_0191_dict['SC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,WILSON RIDGE FARM LLC,5116 WYLIES MILL RD,EDGEMOOR,SC,29712,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,
1,BELGER FARMS & CONSTR INC,2044 BOYKIN RD,REMBERT,SC,29128,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,,,,,,,,,,,


In [66]:
igroup_sic_0191_dict['GA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,HOUSE OF RAEFORD FARMS INC,55 COOPER RD,COMER,GA,30629,201501,POULTRY PROCESSING PLANTS (MFRS),31161501.0,POULTRY PROCESSING,19101.0,FARMS,,,,,,,,,513523.0


## SIC Code 254 Exploration: Poultry Farms

In [None]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 254
df_sic_254 = pd.read_csv("../data/code_254.csv")
  
igroup_sic_254_dict, ctrglow_254_dict = infogroup_counterglow_dict(df_sic_254, df_counterglow_poultry, states, RADIUS_KM)


In [68]:
# igroup_sic_254_dict = keep_certain_columns(igroup_sic_254_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_254_dict, all_df_list)

#### Explore

In [69]:
igroup_sic_254_dict['IA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,VALO BIOMEDIA NORTH AMERICA,21459 OLD HIGHWAY 6,ADEL,IA,50003,283402,POULTRY MEDICINES & VACCINES (MFRS),32541208.0,PHARMACEUTICAL PREPARATION MANUFACTURING,25401.0,POULTRY FARMS,999966.0,FEDERAL GOVERNMENT CONTRACTORS,545101.0,DAIRY PRODUCTS-RETAIL,514404.0,POULTRY-WHOLESALE,,,843668294.0
1,VALO BIOMEDIA NORTH AMERICA,16332 OLD HIGHWAY 6,REDFIELD,IA,50233,283402,POULTRY MEDICINES & VACCINES (MFRS),32541208.0,PHARMACEUTICAL PREPARATION MANUFACTURING,873104.0,LABORATORIES,25401.0,POULTRY FARMS,,,,,,,843668294.0
2,CALEKO FARM INC,3819 330TH ST,BOYDEN,IA,51234,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,19101.0,FARMS,,,,,,,,,
3,REMBRANDT ENTERPRISES,4252 80 AVE,LINN GROVE,IA,51033,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,
4,REMBRANDT ENTERPRISES,4252 80 AVE,LINN GROVE,IA,51033,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,
5,IOWA CAGE FREE LLP,1035 200TH ST,GOLDFIELD,IA,50542,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,
6,FARMERS FRESH POULTRY,5195 FARMERS AVE SW,KALONA,IA,52247,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,543102.0,FARM MARKETS,,,,,,,,,
7,RIVERLAND POULTRY,2015 HIGHWAY 22,KALONA,IA,52247,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,


In [70]:
igroup_sic_254_dict['MO']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,LEUSCHEN POULTRY OPERATIONS,1175 DAIRY CIR,CRANE,MO,65633,514402,POULTRY SERVICES (WHLS),42444002.0,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,25401.0,POULTRY FARMS,,,,,,,,,
1,RIVERAS FARMS LLC,1316 FARM ROAD 2155,EXETER,MO,65647,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,
2,DICK MCKUIN FARMS,2320 STATE HIGHWAY 25,BERNIE,MO,63822,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,


In [71]:
igroup_sic_254_dict['AL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,ROCK CREEK FARMS,400 COUNTY ROAD 134,TOWN CREEK,AL,35672,201501,POULTRY PROCESSING PLANTS (MFRS),31161501.0,POULTRY PROCESSING,19101.0,FARMS,25401.0,POULTRY FARMS,,,,,,,
1,FOUR H FARMS,2440 COUNTY ROAD 113,CENTRE,AL,35960,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,
2,BREEZY BOTTOM FARM,158 NICHOLS RD,ALTOONA,AL,35952,421304,TRUCKING,48423013.0,SPECIALIZED FREIGHT (EXC USED GDS) TRCKNG LNG-...,19101.0,FARMS,25401.0,POULTRY FARMS,,,,,,,
3,DALE MURPHY POULTRY,1355 WARRIOR VALLEY RD,ALTOONA,AL,35952,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,


In [73]:
igroup_sic_254_dict['MS']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,EVANS POULTRY FARMS,380 SCR 79,MIZE,MS,39116,201501,POULTRY PROCESSING PLANTS (MFRS),31161501.0,POULTRY PROCESSING,25401.0,POULTRY FARMS,,,,,,,,,


In [74]:
igroup_sic_254_dict['IN']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,EGG INNOVATIONS,4811 W 100 N,WARSAW,IN,46580,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,
1,RIVER VIEW FARMS INC,2262 E COUNTY ROAD 500 N,ORLEANS,IN,47452,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,
2,S & G POULTRY FARM,2496 S 400 W,MONROE,IN,46772,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,
3,PERDUE FARMS INC,500 PERDUE RD,VINCENNES,IN,47591,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,201501.0,POULTRY PROCESSING PLANTS (MFRS),25401.0,POULTRY FARMS,,,,,,,7529217.0
4,MINNICH POULTRY,8563 E 300 N,PORTLAND,IN,47371,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,,,,,,,,,,,


In [75]:
igroup_sic_254_dict['OH']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,HERTZFELD POULTRY FARMS,15799 MILTON RD,GRAND RAPIDS,OH,43522,19101,FARMS,11199803.0,ALL OTHER MISCELLANEOUS CROP FARMING,25401.0,POULTRY FARMS,,,,,,,,,
1,MEYER HATCHERY,626 STATE ROUTE 89,POLK,OH,44866,92101,FISHERY CONSULTANTS,11251102.0,FINFISH FARMING & FISH HATCHERIES,25401.0,POULTRY FARMS,549907.0,POULTRY-RETAIL,,,,,,,


In [76]:
igroup_sic_254_dict['AR']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,GEORGE'S INC,402 W ROBINSON AVE,SPRINGDALE,AR,72764,201501,POULTRY PROCESSING PLANTS (MFRS),31161501.0,POULTRY PROCESSING,999966.0,FEDERAL GOVERNMENT CONTRACTORS,25401.0,POULTRY FARMS,,,,,,,512392.0


In [78]:
igroup_sic_254_dict['GA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,TYSON FOODS INC,1151 E PINE ST,VIENNA,GA,31092,201501,POULTRY PROCESSING PLANTS (MFRS),31161501.0,POULTRY PROCESSING,514101.0,FOOD PRODUCTS (WHLS),209903.0,FOOD PRODUCTS & MANUFACTURERS,549907.0,POULTRY-RETAIL,549911.0,GAME BIRDS VENISON ETC,25401.0,POULTRY FARMS,7537913.0
1,CLAXTON POULTRY FARMS,8816 US HIGHWAY 301,CLAXTON,GA,30417,201501,POULTRY PROCESSING PLANTS (MFRS),31161501.0,POULTRY PROCESSING,25401.0,POULTRY FARMS,509901.0,EXPORTERS (WHLS),514404.0,POULTRY-WHOLESALE,514403.0,EGGS (WHLS),,,
2,PILGRIM'S PRIDE CORP,136 SWAN BRIDGE RD,TALKING ROCK,GA,30175,25401,POULTRY FARMS,11234001.0,POULTRY HATCHERIES,201501.0,POULTRY PROCESSING PLANTS (MFRS),,,,,,,,,987289857.0


## SIC Code 5144 Exploration: Poultry & Poultry Products

In [None]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 5144
df_sic_5144 = pd.read_csv("../data/code_5144.csv")
  
igroup_sic_5144_dict, ctrglow_5144_dict = infogroup_counterglow_dict(df_sic_5144, df_counterglow_poultry, states, RADIUS_KM)


In [80]:
# igroup_sic_5144_dict = keep_certain_columns(igroup_sic_5144_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_5144_dict, all_df_list)

#### Explore

In [81]:
igroup_sic_5144_dict['IA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,VALO BIOMEDIA NORTH AMERICA,21459 OLD HIGHWAY 6,ADEL,IA,50003,283402,POULTRY MEDICINES & VACCINES (MFRS),32541208,PHARMACEUTICAL PREPARATION MANUFACTURING,25401.0,POULTRY FARMS,999966.0,FEDERAL GOVERNMENT CONTRACTORS,545101.0,DAIRY PRODUCTS-RETAIL,514404.0,POULTRY-WHOLESALE,,,843668294.0
1,FREMONT FARMS OF IOWA,3868 110TH ST,MALCOM,IA,50157,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,,,
2,CENTRUM VALLEY FARMS,2674 HIGHWAY 69,GALT,IA,50101,19101,FARMS,11199803,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),541105.0,GROCERS-RETAIL,,,,,,,
3,IOWA CAGE FREE,1641 YELLOWSTONE AVE,CLEARFIELD,IA,50840,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,541105.0,GROCERS-RETAIL,,,,,,,,,
4,OSAGE EGG CO,3405 KIRKWOOD AVE,OSAGE,IA,50461,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,549914.0,EGGS-RETAIL,,,,,,,,,
5,SIOUX COUNTY EGG FARM LLP,2716 380TH ST,SIOUX CENTER,IA,51250,19101,FARMS,11199803,ALL OTHER MISCELLANEOUS CROP FARMING,514404.0,POULTRY-WHOLESALE,,,,,,,,,
6,E & W POULTRY FARM,2618 340TH ST,ROCK VALLEY,IA,51247,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,549914.0,EGGS-RETAIL,,,,,,,,,
7,SUNRISE FARMS INC,2060 WHITE AVE,HARRIS,IA,51345,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,19101.0,FARMS,,,,,,,,,
8,FREMONT FARMS,3205 295TH ST,FREMONT,IA,52561,514101,FOOD PRODUCTS (WHLS),42442005,PACKAGED FROZEN FOOD MERCHANT WHOLESALERS,514403.0,EGGS (WHLS),999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,,,,,
9,FARMERS HEN HOUSE,1956 520TH ST SW,KALONA,IA,52247,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,999966.0,FEDERAL GOVERNMENT CONTRACTORS,549914.0,EGGS-RETAIL,,,,,,,


In [82]:
igroup_sic_5144_dict['MO']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,JOHNSON COUNTY EGG FARM,1275 SE Y HWY,KNOB NOSTER,MO,65336,19101,FARMS,11199803,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),,,,,,,,,
1,KNOB NOSTER PULLETS,1251 SE Y HWY,KNOB NOSTER,MO,65336,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,,,,,,,,,,,
2,JOHNSON COUNTY EGG FARM,1285 SE Y HWY,KNOB NOSTER,MO,65336,19101,FARMS,11199803,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),549914.0,EGGS-RETAIL,,,,,,,
3,LEUSCHEN POULTRY OPERATIONS,1175 DAIRY CIR,CRANE,MO,65633,514402,POULTRY SERVICES (WHLS),42444002,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,25401.0,POULTRY FARMS,,,,,,,,,
4,MOARK PRODUCTION,17331 HIGHWAY D,NEOSHO,MO,64850,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,549914.0,EGGS-RETAIL,,,,,,,,,
5,MOARK PRODUCTION INC,19242 MALLARD DR,NEOSHO,MO,64850,19101,FARMS,11199803,ALL OTHER MISCELLANEOUS CROP FARMING,514403.0,EGGS (WHLS),549914.0,EGGS-RETAIL,,,,,,,


In [83]:
igroup_sic_5144_dict['AL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,KOCH FOODS INC,764 GEORGE CAGLE DR,COLLINSVILLE,AL,35961,201501,POULTRY PROCESSING PLANTS (MFRS),31161501,POULTRY PROCESSING,514402.0,POULTRY SERVICES (WHLS),,,,,,,,,517549762.0


In [84]:
igroup_sic_5144_dict['MS']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,TOTAL POULTRY SVC LLC,130 STOVALL RD # 2,KOKOMO,MS,39643,514402,POULTRY SERVICES (WHLS),42444002,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,,,,,,,,,,,


In [85]:
igroup_sic_5144_dict['IN']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,WABASH VALLEY PRODUCE INC,4886 E 450N,DUBOIS,IN,47527,204803,FEED-MANUFACTURERS,31111903,OTHER ANIMAL FOOD MANUFACTURING,519112.0,FEED-DEALERS (WHLS),514403.0,EGGS (WHLS),549914.0,EGGS-RETAIL,999966.0,FEDERAL GOVERNMENT CONTRACTORS,,,


In [86]:
igroup_sic_5144_dict['KY']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,CAL-MAINE FOODS INC,9729 GUTHRIE RD,GUTHRIE,KY,42234,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,,,,,,,,,,,431481290.0


In [88]:
igroup_sic_5144_dict['NC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,SIMPSON'S EGGS INC,5015 E HIGHWAY 218,MONROE,NC,28110,514403,EGGS (WHLS),42444001,POULTRY & POULTRY PRODUCT MERCHANT WHOLESALERS,549914.0,EGGS-RETAIL,,,,,,,,,


In [89]:
igroup_sic_5144_dict['GA']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,CLAXTON POULTRY FARMS,8816 US HIGHWAY 301,CLAXTON,GA,30417,201501,POULTRY PROCESSING PLANTS (MFRS),31161501,POULTRY PROCESSING,25401.0,POULTRY FARMS,509901.0,EXPORTERS (WHLS),514404.0,POULTRY-WHOLESALE,514403.0,EGGS (WHLS),,,


## SIC Code 5154 Exploration: Livestock

In [21]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 5154
df_sic_5154 = pd.read_csv("../data/code_5154.csv")
  
igroup_sic_5154_dict, ctrglow_5154_dict = infogroup_counterglow_dict(df_sic_5154, df_counterglow_poultry, states, RADIUS_KM)


In [91]:
# igroup_sic_5154_dict = keep_certain_columns(igroup_sic_5154_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_5154_dict, all_df_list)

#### Explore

In [93]:
igroup_sic_5154_dict['AL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,ROCKING W LIVESTOCK EQPT SALES,600 N JOHNSON CHAPEL RD,DANVILLE,AL,35619,515403,LIVESTOCK-DEALERS (WHLS),42452008,LIVESTOCK MERCHANT WHOLESALERS,,,,,,,,,,,
1,MID STATE STOCKYARDS LLP,8415 STATE HIGHWAY 97 S,LETOHATCHEE,AL,36047,478904,STOCK YARDS,48821007,SUPPORT ACTIVITIES FOR RAIL TRANSPORTATION,515402.0,LIVESTOCK AUCTION MARKETS (WHLS),,,,,,,,,


## SIC Code 0251: Broiler, Fryer, and Roaster Chickens

In [22]:
# To see how many matches exist within the dataframe consisting of SIC Codes containing 0251
df_sic_0251 = pd.read_csv("../data/code_0251.csv")
  
igroup_sic_0251_dict, ctrglow_0251_dict = infogroup_counterglow_dict(df_sic_0251, df_counterglow_poultry, states, RADIUS_KM)


NC: Total number of matches: 1


In [97]:
# igroup_sic_0251_dict = keep_certain_columns(igroup_sic_0251_dict)

In [None]:
# loop through the infogroup dictionary, each key value matches to a dictionary
# grab the dictionary and append it to all_df_list

all_df_list = list_of_dataframes(igroup_sic_0251_dict, all_df_list)

#### Explore

In [98]:
igroup_sic_0251_dict['MO']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,TRIPLE P RANCH & EQUIPMENT LLC,22211 FIVE BRIDGES AVE,COLE CAMP,MO,65325,25198,BROILER FRYER & ROASTER CHICKENS,11232001,BROILERS & OTHER MEAT TYPE CHICKEN PRODUCTION,508303.0,POULTRY EQUIPMENT & SUPPLIES (WHLS),,,,,,,,,


In [99]:
igroup_sic_0251_dict['AL']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,WOODHAM FARM,2501 COUNTY ROAD 53,CLAYTON,AL,36016,25298,CHICKEN EGGS,11231001,CHICKEN EGG PRODUCTION,25198.0,BROILER FRYER & ROASTER CHICKENS,,,,,,,,,


In [102]:
igroup_sic_0251_dict['NC']

Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,PRIMARY SIC CODE,SIC6_DESCRIPTIONS,PRIMARY NAICS CODE,NAICS8 DESCRIPTIONS,SIC CODE,SIC6_DESCRIPTIONS (SIC),SIC CODE 1,SIC6_DESCRIPTIONS (SIC1),SIC CODE 2,SIC6_DESCRIPTIONS(SIC2),SIC CODE 3,SIC6_DESCRIPTIONS(SIC3),SIC CODE 4,SIC6_DESCRIPTIONS(SIC4),PARENT NUMBER
0,REYNOLDS FARMS,7518 CARL POLK RD,MONROE,NC,28110,25198,BROILER FRYER & ROASTER CHICKENS,11232001,BROILERS & OTHER MEAT TYPE CHICKEN PRODUCTION,,,,,,,,,,,


## To CSV

In [None]:
### concat all DataFrames & convert to csv

infogroup_concat = pd.concat(all_df_list)

FILEPATH = "../data/infogroup_matches_.csv"
infogroup_concat.to_csv(FILEPATH) # save as CSV file

## NO SIC CODE: Looking for hits on certain states

Below code not executed. Can be ignored. Files too large to run on computer, aborted before finished

In [13]:
certain_states = ['IA', 'OK', 'MO', 'OK', 'AL', 'LA', 'MS', 'IL', 'IN', 'OH', 'KY', 'TN', 'AR', 'NC', 'SC', 'GA']

In [9]:
RADIUS_KM = 0.321869

In [60]:
"""
funtion will take 4 inputs. infogroup_df & counterglow_df2 are the dataframes being analyzed.
the third input is the specific state that we are choosing to analyze
the fourth input is the threshold distance. this distance is the max allowable distance between 2
datapoints. the output is a dataframe that in each row, we have a datapoint that represents a
datapoint from infogroup and (x distance away) a farm spotted in the counterglow data. we are
speculating that it is possible for a spotted farm in counterglow to not have the most precise address
and actually exist in the Infogroup data, but with slightly different longitude and latitude
"""

def potential_farms_mod(infogroup_df, counterglow_df, max_dist_km):
    
    # print("Computing infogroup...")
    # infogroup_df     = infogroup_df.compute()
    
    # print("Computing counterglow...")
    # counterglow_df   = counterglow_df.compute()
    
    # create two new empty dataframe that we will be adding to when match is found
    infogroup_trim     = pd.DataFrame(columns=infogroup_df.columns)
    counterglow_trim   = pd.DataFrame(columns=counterglow_df.columns)
    
    counter = 0 # to counter matches, can print to terminal if desired
    
    print("Starting for i loop...")
    for i in range(len(infogroup_df)):
        print("starting here...")
        # infogroup_longitude  = infogroup_df.iloc[i]["LONGITUDE"].compute()  # get longitude
        # infogroup_latitude   = infogroup_df.iloc[i]["LATITUDE"].compute()   # get latitude
        
        infogroup_longitude  = infogroup_df.loc[i, "LONGITUDE"].compute()   # get longitude
        infogroup_latitude   = infogroup_df.loc[i, "LATITUDE"].compute()    # get latitude
        
        print(infogroup_longitude, infogroup_latitude)
        
        
        # for j in range(len(counterglow_df)):
            
        #     # counterglow_latitude    = counterglow_df.iloc[j]["Lat"].compute()    # get latitude
        #     # counterglow_longitude   = counterglow_df.iloc[j]["Lat.1"].compute()  # get longitude
        #     counterglow_latitude    = counterglow_df.loc[j, "Lat"]    # get latitude
        #     counterglow_longitude   = counterglow_df.loc[j, "Lat.1"]  # get longitude
            
        #     print(type(infogroup_longitude), type(infogroup_latitude), type(counterglow_longitude), type(counterglow_latitude))
            
        #     dist_km                 = haversine(infogroup_longitude, infogroup_latitude, 
        #                                         counterglow_longitude, counterglow_latitude)
            
        #     if(dist_km <= max_dist_km): # if the distance is <= the max distance set in function
        #         counter += 1
                
        #         # new_row = infogroup_df.iloc[i]
        #         # infogroup_trim.loc[len(infogroup_trim.index)]      = infogroup_df.iloc[i]
        #         infogroup_trim = dd.concat([infogroup_trim, infogroup_df.iloc[i]], axis=0)
                
        #         # counterglow_trim.loc[len(counterglow_trim.index)]  = counterglow_df.iloc[j]
        #         counterglow_trim = dd.concat([counterglow_trim, counterglow_trim.iloc[j]], axis=0)
                
        
    # change the name of the columns for Latitude & Longitude in each dataframe
    # for Infogroup Dataframe
    infogroup_trim      = infogroup_trim.rename(columns={'LATITUDE': 'LATITUDE 1', 
                                                        'LONGITUDE': 'LONGITUDE 1'})
    counterglow_trim    = counterglow_trim.rename(columns={'Lat' : 'LATITUDE 2',
                                                           'Lat.1': 'LONGITUDE 2'})           
    return infogroup_trim, counterglow_trim   
    

In [55]:
# load counterglow dataset
# df_counterglow = pd.read_csv("../data/Counterglow+Facility+List+Complete.csv")
df_counterglow = dd.read_csv("../data/Counterglow+Facility+List+Complete.csv", dtype=str, encoding='unicode_escape')

In [56]:
df_counterglow = df_counterglow[df_counterglow['State'].isin(certain_states)]
df_counterglow = df_counterglow.compute()

In [None]:
df_counterglow['State'].value_counts()

In [58]:
# df_infogroup = pd.read_csv("../data/certain_states.csv")
df_infogroup = dd.read_csv("../data/certain_states.csv", dtype=str, encoding='unicode_escape')
df_infogroup.compute()

Unnamed: 0.1,Unnamed: 0,COMPANY,ADDRESS LINE 1,CITY,STATE,ZIPCODE,ZIP4,COUNTY CODE,AREA CODE,IDCODE,...,POPULATION CODE,CENSUS TRACT,CENSUS BLOCK,LATITUDE,LONGITUDE,MATCH CODE,CBSA CODE,CBSA LEVEL,CSA CODE,FIPS CODE
0,1,,11700 OLIO RD,FISHERS,IN,46037,7618,057,317,1,...,7,110808,1,039.959999,-085.921268,P,26900,2,294,18057
1,9,,11725 ILLINOIS ST # 140,CARMEL,IN,46032,3010,057,317,1,...,7,111001,2,039.951396,-086.160933,0,26900,2,294,18057
2,10,,11725 ILLINOIS ST # 140,CARMEL,IN,46032,3010,057,317,1,...,7,111001,2,039.951396,-086.160933,0,26900,2,294,18057
3,13,MADISON COUNTY COURTHOUSE,16 E 9TH ST,ANDERSON,IN,46016,1598,095,765,2,...,6,011900,2,040.107502,-085.678706,P,26900,2,294,18095
4,18,DOG HAUS VENUE,12880 E 146TH ST,NOBLESVILLE,IN,46060,9582,057,317,2,...,7,110100,3,040.005310,-085.930786,P,26900,2,294,18057
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
231448,172074,SUPERIOR TILE,400 ERASTE LANDRY RD,LAFAYETTE,LA,70506,2324,055,337,2,...,7,000602,2,030.229632,-092.043905,P,29180,2,318,22055
231449,172076,NEW BEGINNINGS CHRISTIAN ACAD,401 W POPLAR ST,ELIZABETHTOWN,KY,42701,1743,093,270,2,...,7,001402,3,037.700819,-085.865386,0,21060,2,350,21093
231450,172084,JIM'S LOUNGE,213 E GLORIA SWITCH RD,LAFAYETTE,LA,70507,,055,337,2,...,6,001001,1,030.281900,-092.025500,X,29180,2,318,22055
231451,172085,A-BEAR'S KIDS ONLY PRESCHOOL,155 GRAND AVE,LAFAYETTE,LA,70503,4636,055,337,2,...,7,001700,4,030.181455,-092.059365,P,29180,2,318,22055


In [61]:
infogroup_matches, counterglow_matches = potential_farms_mod(df_infogroup, df_counterglow, RADIUS_KM)

Starting for i loop...


starting here...
0    -085.921268
0    -088.022737
0    -094.797800
0    -083.880811
0    -085.652630
0    -092.421922
0    -085.711388
0    -090.557094
0    -082.586227
0    -092.383231
0    -081.797501
0    -083.873633
0    -095.922500
0    -091.160516
0    -089.991122
0    -086.158777
0    -087.568974
0    -087.747498
0    -087.644586
0    -090.148745
Name: LONGITUDE, dtype: object 0    039.959999
0    042.103739
0    036.607700
0    033.978724
0    038.269739
0    042.542957
0    038.327187
0    038.136055
0    032.381588
0    036.333650
0    040.421810
0    034.230394
0    036.732000
0    030.393809
0    035.137792
0    040.488876
0    038.249576
0    042.058970
0    041.940211
0    041.862457
Name: LATITUDE, dtype: object
starting here...


KeyboardInterrupt: 