In [75]:
import pandas as pd
import numpy as np

### Comparing poultry in AK

Across the two datasets, there are 7 CAFOs registered in both, while 10/17 CAFOs in Iowa's dataset are unique and 299/306 CAFOs in Counterglow's dataset are unique.

In [76]:
counterglow = pd.read_csv("../data/Counterglow+Facility+List+Complete.csv")
iowa_ar = pd.read_csv("../data/Poultry CAFOs in Arkansas.csv")

In [102]:
counterglow["Name"] = counterglow["Name"].astype(str, copy=False).apply(lambda x : x.title())

In [103]:
iowa_ar["NAME"] = iowa_ar["NAME"].apply(lambda x : x.title())

In [106]:
cg_ar = counterglow[counterglow["State"]=="AR"]["Name"]

both = []
only_iowa = []

for i in list(iowa_ar["NAME"]):
    if i in list(cg_ar):
        both.append(i)
    else:
        only_iowa.append(i)

In [100]:
only_cg = []

for i in cg_ar:
    if i not in both:
        only_cg.append(i)

len(only_cg)

299

In [107]:
both, only_iowa, only_cg

(['Cal-Maine Foods',
  'Todd Avery Poultry',
  'Hindsville Research Farm',
  'Khoi Nguyen Poultry Pads',
  'Nguyen Poultry',
  'U Of A Poultry Farm',
  'Robert Squires Farm'],
 ['Benton County Foods/Feemster',
  'Pitcher Farms',
  'Tyson Foods-Rison Hatchery',
  'Keith Smith Co., Inc.',
  'Con Agra Foods-Refrig Foods',
  'Wesley Farms',
  'Pilgrims Pride-Nashville Feed',
  'Mcminn Breeder Houses',
  'Arkansas Egg Co.,Inc./Summers',
  'Tyson Foods-Lincoln Hatchery'],
 ['\xa0Central Ark Prca Rodeo\xa0',
  '\xa0Hills Auto Sales Pro Rodeo\xa0',
  '\xa0Magnolia Stampede\xa0',
  '\xa0Old Fort Days Rodeo\xa0',
  '\xa0Sharp County Fair Rodeo\xa0',
  '1St West.Bank/ Pam Beahm Farm',
  'Ackerman, Gary',
  'Alexander, Scott/S & A Farms',
  'Alexander, Steve',
  'Alexander, Steve & Kim',
  'Ar Tech Univ.Foun./Alpha Farm',
  'Arch Farms, Llc',
  'Arkansas Department Of Corrections',
  'Arkansas Egg Co. Llc - Appletown',
  'Arnold, Billy',
  'Aubrey Kinion - Tyson',
  'Ayers, Ronnie',
  'Bacon Creek

### Generalized comparison function

- Alabama had the most CAFOs in common between the two datasets, all other states had far fewer or none
- Arkansas, North Carolina, and Texas had the least data from the University of Iowa, otherwise the number of entries between the two datasets was usually balanced
- Unnamed/NaN/Unknown farms were excluded from both datasets before analysis

In [173]:
def compare_CAFOs(cg_path, iowa_path, state):
    counterglow = pd.read_csv(cg_path)
    iowa = pd.read_csv(iowa_path)
    counterglow["Name"] = counterglow["Name"].astype(str, copy=False).apply(lambda x : x.title())
    iowa["NAME"] = iowa["NAME"].apply(lambda x : x.title())

    cg_state = [i for i in counterglow[counterglow["State"]==state]["Name"] if i != "Unknown" and i != "Nan"]
    iowa_unique = list(iowa["NAME"].dropna())

    both, only_iowa, only_cg = [], [], []

    for i in iowa_unique:
        if i in cg_state:
            both.append(i)
        else:
            only_iowa.append(i)

    for i in cg_state:
        if i not in both:
            only_cg.append(i)

    print("Common to both: " + str(len(both)) + "\nOnly in Iowa dataset: " + str(len(only_iowa)) + "\nOnly in Counterglow: " + str(len(only_cg)))
    return (both, only_iowa, only_cg)

In [174]:
cg_path = "../data/Counterglow+Facility+List+Complete.csv"
iowa_path = "../data/Poultry CAFOs in Mississippi.csv"

compare_CAFOs(cg_path, iowa_path, "MS")

Common to both: 30
Only in Iowa dataset: 530
Only in Counterglow: 523


(['Judson Wilson, Poultry',
  'Brenda Perry, Poultry',
  'Jason Smith, Poultry Farm Two',
  'Tucker Estes, Poultry',
  'Charles Cumberland, Poultry',
  'Eliza Thomas, Poultry',
  'Nathan Hayes, Poultry',
  'Julian Franco, Poultry Farm 2',
  'Johnnie W Marshall, Poultry',
  'David Breazeale, Poultry',
  'Phil Rhinewalt, Poultry',
  'Clint And Jessica Akerman, Poultry',
  'Chris Carter, Poultry',
  'Jerry Watkins, Poultry',
  'Chris Sims, Poultry',
  'Tim And Sherry Conner, Poultry',
  'Steve Thornton, Poultry',
  'Rickey Johnson, Poultry',
  'Jeremy Bardon, Poultry',
  'Kathy Hill, Poultry',
  'Harry Mclain, Poultry',
  'Rod Yelverton, Poultry',
  'Charles David Williams, Poultry',
  'Joey Thrash, Poultry',
  'Ryan Hillhouse, Poultry Farm Number 2',
  'Josh Slay, Poultry',
  'Scott Mincey, Poultry',
  'Danny Ginn, Poultry',
  'Tristan Howell, Poultry',
  'Barry Sharp, Poultry'],
 ['Randy Flake, Poultry',
  'Sorgum Branch Poultry Farm',
  'Devon Sharp, Poultry',
  'Bobby Wilson, Poultry'

In [175]:
cg_path = "../data/Counterglow+Facility+List+Complete.csv"
iowa_path = "../data/Poultry CAFOs in Alabama.csv"

compare_CAFOs(cg_path, iowa_path, "AL")

Common to both: 576
Only in Iowa dataset: 456
Only in Counterglow: 437


(['Abercrombie Farms',
  'Beaty Poultry Farm',
  'C And C Farms',
  'Chaney Branch Farms',
  'Cox Farms',
  'Eric Sutton Poultry',
  'Four H Farm',
  'Helms Poultry Farms',
  'Mcrae Poultry Farms',
  'Noel Welch Farms',
  'Parsons Farm',
  'Pinnacle Farms',
  'Shane Bowman Farms',
  'Southern Pride Poultry Farm',
  'Todd Sconyers Farm',
  'Tyler Poultry Farms',
  'Woodham Farms',
  'Big Spring Creek Farm',
  'Curtis Hawkins Farm',
  'Dixieland Farms',
  'Double H Farm',
  'Faith Farm',
  'Fort Bragg Farm',
  'Graves Creek Farm',
  'Green Acres Farm',
  'Holmes Farms Inc.',
  'Maze Farm Inc.',
  'Miller Poultry, Llc',
  'Murphree Valley Farms',
  'Rock Springs Farm, Llc',
  'Sdh Farm',
  'Slap Happy Farm',
  'Smith Farms',
  'Whitley Poultry Farm',
  'Charles Kilpatrick',
  'Craig Grant',
  'Faron Frazier Farm',
  'Gafford Farms',
  'Harold Parmer',
  'James M Kilpatrick Farm',
  'Jerry Stinson',
  'Ken Burkett',
  'Lloyd Shell Farm',
  'Mitchell Farms',
  'Randy Smith',
  'Tommy Thomps

In [176]:
cg_path = "../data/Counterglow+Facility+List+Complete.csv"
iowa_path = "../data/Poultry CAFOs in Arkansas.csv"

compare_CAFOs(cg_path, iowa_path, "AR")

Common to both: 7
Only in Iowa dataset: 10
Only in Counterglow: 232


(['Cal-Maine Foods',
  'Todd Avery Poultry',
  'Hindsville Research Farm',
  'Khoi Nguyen Poultry Pads',
  'Nguyen Poultry',
  'U Of A Poultry Farm',
  'Robert Squires Farm'],
 ['Benton County Foods/Feemster',
  'Pitcher Farms',
  'Tyson Foods-Rison Hatchery',
  'Keith Smith Co., Inc.',
  'Con Agra Foods-Refrig Foods',
  'Wesley Farms',
  'Pilgrims Pride-Nashville Feed',
  'Mcminn Breeder Houses',
  'Arkansas Egg Co.,Inc./Summers',
  'Tyson Foods-Lincoln Hatchery'],
 ['\xa0Central Ark Prca Rodeo\xa0',
  '\xa0Hills Auto Sales Pro Rodeo\xa0',
  '\xa0Magnolia Stampede\xa0',
  '\xa0Old Fort Days Rodeo\xa0',
  '\xa0Sharp County Fair Rodeo\xa0',
  '1St West.Bank/ Pam Beahm Farm',
  'Ackerman, Gary',
  'Alexander, Scott/S & A Farms',
  'Alexander, Steve',
  'Alexander, Steve & Kim',
  'Ar Tech Univ.Foun./Alpha Farm',
  'Arch Farms, Llc',
  'Arkansas Department Of Corrections',
  'Arkansas Egg Co. Llc - Appletown',
  'Arnold, Billy',
  'Aubrey Kinion - Tyson',
  'Ayers, Ronnie',
  'Bacon Creek

In [177]:
cg_path = "../data/Counterglow+Facility+List+Complete.csv"
iowa_path = "../data/Poultry CAFOs in North Carolina.csv"

compare_CAFOs(cg_path, iowa_path, "NC")

Common to both: 10
Only in Iowa dataset: 9
Only in Counterglow: 322


(['Flint Ridge Pullet Farm',
  'Gardner Farms 2',
  'Hyde County Egg Farm',
  'Hyde County Egg Farm',
  'Red Hill Eggs Llc',
  'Rose Poultry Farm',
  'Spring Hope Poultry Inc 2',
  'A&D Poultry',
  "Latta'S Egg Ranch",
  "Simpson'S Eggs Inc"],
 ['Xiong Farm',
  'Chicken Hollow Farms',
  'D&M Poultry',
  'Edwin Reid Poultry Farm',
  'Production Enterprise Inc. Farm',
  'Yang Farm',
  'Warren Boone Farm',
  'Twin J Farms',
  'Enterprise Farm Caledonia'],
 ['A.D. And Carlton Williard',
  'Acorn Ridge',
  'Acre Station Meat Farm',
  'Alan Coble Farm',
  'Alan Smith Dairy Farm',
  'Anderson Farm',
  'Armo Llc',
  'Arrowhead Poultry',
  'Asj Mathis Farms, Llc',
  'Aycoth Farm',
  'B&P Farms',
  'Back\xa0Forty\xa0Farm (Bw\xa0Pope,\xa0Inc.)',
  'Barbara Walker/Walker Farms',
  'Barbara Wall',
  'Barefoot\xa0Farm',
  'Bb Dairy',
  'Beal Family Farms',
  'Beam Dairy',
  'Beam Dairy',
  'Beard Farm',
  'Beaver-Rill Farms, Inc',
  'Beeson Farm',
  'Benson Sow Farm Llc',
  'Bethel Farm',
  'Beville

In [178]:
cg_path = "../data/Counterglow+Facility+List+Complete.csv"
iowa_path = "../data/Poultry CAFOs in South Carolina.csv"

compare_CAFOs(cg_path, iowa_path, "SC")

Common to both: 0
Only in Iowa dataset: 629
Only in Counterglow: 32


([],
 ['Mark Speer Poultry Farm',
  'Nicholas Stokes Poultry',
  'Padgett Poultry House',
  'Padgett Poultry House',
  'Mcfarlan Farm',
  'Red Legged Rooster',
  'Marc Marsh/ Rooster Coop',
  'Smith, S L,  Breeder Farm',
  'Rafael Poultry',
  'Creekside Farm',
  'Quail Creek Farm',
  'Evans, Mitchell/Broiler Facili',
  'Sanders Breeder Farm',
  'Windy Hill Poultry Farm',
  'Fickling, Tal/Breeder Farm',
  'Humble Acres Breeder Farm',
  'A.T. Gales Breeder Operation',
  'Cullen Bolen, Llc',
  'Walker Nix Breeder Farm',
  'Swartz Breeder Facility',
  'Norris Farms (Breeders)',
  'Den-Mar Farms (Mccaskill)',
  'South Fork Farms',
  'Corn House Farm',
  'Knight Breeder Farm',
  'Huckleberry Head Farm',
  'Osborne Poultry Farm',
  'Sandifer & Son Farms',
  'Smoak Poultry Farm',
  'Four Winds Farm',
  'Bay Branch Poultry Farm',
  'Carey Frick Breeder Farm',
  'Vintage Acres, Llc',
  'Samples Poultry Farms',
  'Brown Poultry Farm',
  'Vasser Poultry Farm',
  'Bolen Poultry Farm',
  'Jeff David

In [180]:
cg_path = "../data/Counterglow+Facility+List+Complete.csv"
iowa_path = "../data/Poultry CAFOs in Texas.csv"

compare_CAFOs(cg_path, iowa_path, "TX")

Common to both: 10
Only in Iowa dataset: 16
Only in Counterglow: 521


(['Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice',
  'Texas Department Of Criminal Justice'],
 ['Feather Crest Farms Inc',
  'Brunner, Allan James',
  'Idalou Egg Ranch Lp',
  'Cal-Maine Foods Inc',
  'Cal-Maine Foods Inc',
  'Cal-Maine Foods Inc',
  'Cal-Maine Foods Inc',
  'Cal-Maine Foods Inc',
  'Cal-Maine Foods Inc',
  'Kieke Egg Farm Llc',
  'Cal-Maine Foods Inc',
  'Wharton County Foods Llc',
  'Feather Crest Farms Inc',
  'Red River Valley Egg Farm Llc',
  'Cal-Maine Foods Inc',
  'Cal-Maine Foods Inc'],
 ['\xa0\xa0Matagorda County Fair & Rodeo',
  '\xa0Abc Pro Rodeo\xa0',
  '\xa0Angelina Benefit Rodeo\xa0',
  '\xa0Bandera Pro Rodeo\xa0',
  '\xa0Bell County