In [6]:
# Purpose: import data from any title company and reformat it so that complete names,
# companies, etc. are all parsed and ready for proper skip-tracing.
import pandas as pd

In [7]:
# Base name of the export; it is used both as the folder under ./data and as
# the CSV file name inside that folder.
filename = "absentee_98001_98003_20-50_imps_5yrs_owned"

# Load the untouched export into a DataFrame.
raw = pd.read_csv(filepath_or_buffer=f'./data/{filename}/{filename}.csv')

In [8]:
# Inspect the column labels of the raw export to decide which ones to map.
raw.columns

Index(['Parcel #', 'Owner First', 'Owner Last', 'Owner Full', 'Site',
       'Site City', 'Site State', 'Site Zip', 'Mail', 'Mail City',
       'Mail State', 'Mail Zip', 'Bedrooms', 'Bathrooms', 'Building Sq Ft',
       'Lot Sq Ft', 'Acres', 'Year Built', '% Improvement', 'Total AV',
       'Improvement AV', 'Land AV', 'Taxes', 'Tax Year ', 'Sale Date', 'Price',
       'Zoning', 'Land Use'],
      dtype='object')

In [57]:
# Maps the title-company export's column labels to the short names used in the
# rest of this notebook. Only the columns listed here are kept.
# NOTE(review): "maill_state" looks like a typo for "mail_state"; it is left
# as-is because the exported CSVs carry this column name -- confirm before renaming.
# NOTE(review): 'Mail Zip' exists in the raw export but is not mapped here,
# while 'Site Zip' is -- confirm whether the mailing zip should be carried over.
TITLECO_MAPPING = {
    'Parcel #': "parcel",
    'Owner Full': "full_name",
    'Owner Last': "last_name",
    'Owner First': "first_name",
    'Mail': "mail_add",
    'Mail City': "mail_city",
    'Mail State': "maill_state",
    'Site': "prop_add",
    'Site City': "prop_city",
    'Site State': "prop_state",
    'Site Zip': "prop_zip"
}

# Regex alternation of substrings that mark an owner name as an entity rather
# than a person. It is matched case-sensitively and without word boundaries,
# so "Co" also matches inside longer words (e.g. "Covenant").
ENTITY_NAMES = "|".join(["Inc", "Trust", "L L C", "LLC", "Corp", "Homes", "Co"])

# Keep only the mapped columns and rename them. The rename must use
# TITLECO_MAPPING (the mapping defined in this cell); the previous code
# referenced LISTSOURCE_MAPPING, which is not defined in this notebook and
# raised NameError on a fresh kernel.
mapped_cols = raw[list(TITLECO_MAPPING)].rename(columns=TITLECO_MAPPING)

In [69]:
# Show rows whose full_name matches an entity keyword; missing names are
# treated as matches (na=True).
mapped_cols.loc[
    mapped_cols["full_name"].str.contains(ENTITY_NAMES, na=True, regex=True)
]

Unnamed: 0,parcel,full_name,last_name,first_name,mail_add,mail_city,maill_state,prop_add,prop_city,prop_state,prop_zip
7,3321049039,Federal Way Central Presbyterian Co,Co,Federal Way Central Presbyterian,32210 24th Ave SW,Federal Way,WA,37427 28th Ave S,Federal Way,WA,98003
9,7967600261,Dimension Townhouses LLC,Dimension Townhouses LLC,,PO Box 58264,Seattle,WA,27855 46th Ave S,Auburn,WA,98001
15,7853600045,Shannon K Hooper Trust,Hooper Shannon K Trust,,43670 Carmel Cir,Palm Desert,CA,31021 20th Ave S,Federal Way,WA,98003
29,7203000461,Mountain Niso LLC,Mountain Niso LLC,,PO Box 3482,Redmond,WA,28430 14th Ave S,Federal Way,WA,98003
34,4045700675,Orcas Homes LLC,Orcas Homes LLC,,12411 NE 80th Way,Kirkland,WA,3412 S 360th St,Auburn,WA,98001
35,5066400035,Overcomer Covenant Church,Overcomer Covenant Church,,33415 Military Rd S,Auburn,WA,33607 Military Rd S,Auburn,WA,98001
36,5066400120,Overcomer Covenant Church,Overcomer Covenant Church,,33415 Military Rd,Auburn,WA,4406 S 338th St,Auburn,WA,98001
37,3751604107,People Infra LLC,People Infra LLC,,4012 164th Ct NE,Redmond,WA,4200 S 360th St,Auburn,WA,98001
39,5151600415,Powell Rental Co,Powell Rental Co,,PO Box 66708,Burien,WA,1103 S 299th Pl,Federal Way,WA,98003
45,1547600150,Schneider Family Homes LLC,Schneider Family Homes LLC,,6510 Southcenter Blvd #1,Tukwila,WA,28202 48th Ave S,Auburn,WA,98001


In [61]:
# Show rows whose first_name matches one of the hard-coded entity keywords;
# missing first names are treated as matches (na=True).
mapped_cols.loc[
    mapped_cols["first_name"].str.contains(
        "Inc|Trust|LLC|L L C|Assembly|corp|Homes|Co", na=True, regex=True
    )
]

Unnamed: 0,parcel,full_name,last_name,first_name,mail_add,mail_city,maill_state,prop_add,prop_city,prop_state,prop_zip
9,7967600261,Dimension Townhouses LLC,Dimension Townhouses LLC,,PO Box 58264,Seattle,WA,27855 46th Ave S,Auburn,WA,98001
15,7853600045,Shannon K Hooper Trust,Hooper Shannon K Trust,,43670 Carmel Cir,Palm Desert,CA,31021 20th Ave S,Federal Way,WA,98003
25,421049032,Midway Samoan Assembly,Midway Samoan Assembly,,29276 Military Rd S,Federal Way,WA,29414 Military Rd S,Federal Way,WA,98003
29,7203000461,Mountain Niso LLC,Mountain Niso LLC,,PO Box 3482,Redmond,WA,28430 14th Ave S,Federal Way,WA,98003
34,4045700675,Orcas Homes LLC,Orcas Homes LLC,,12411 NE 80th Way,Kirkland,WA,3412 S 360th St,Auburn,WA,98001
35,5066400035,Overcomer Covenant Church,Overcomer Covenant Church,,33415 Military Rd S,Auburn,WA,33607 Military Rd S,Auburn,WA,98001
36,5066400120,Overcomer Covenant Church,Overcomer Covenant Church,,33415 Military Rd,Auburn,WA,4406 S 338th St,Auburn,WA,98001
37,3751604107,People Infra LLC,People Infra LLC,,4012 164th Ct NE,Redmond,WA,4200 S 360th St,Auburn,WA,98001
39,5151600415,Powell Rental Co,Powell Rental Co,,PO Box 66708,Burien,WA,1103 S 299th Pl,Federal Way,WA,98003
45,1547600150,Schneider Family Homes LLC,Schneider Family Homes LLC,,6510 Southcenter Blvd #1,Tukwila,WA,28202 48th Ave S,Auburn,WA,98001


In [48]:
# Show rows whose last_name matches one of the hard-coded entity keywords;
# missing last names are treated as matches (na=True).
mapped_cols.loc[
    mapped_cols["last_name"].str.contains(
        "Inc|Trust|LLC|L L C|Assembly|corp|Homes|Co", na=True, regex=True
    )
]

Unnamed: 0,parcel,full_name,last_name,first_name,mail_add,mail_city,maill_state,prop_add,prop_city,prop_state,prop_zip
7,3321049039,Federal Way Central Presbyterian Co,Co,Federal Way Central Presbyterian,32210 24th Ave SW,Federal Way,WA,37427 28th Ave S,Federal Way,WA,98003
9,7967600261,Dimension Townhouses LLC,Dimension Townhouses LLC,,PO Box 58264,Seattle,WA,27855 46th Ave S,Auburn,WA,98001
15,7853600045,Shannon K Hooper Trust,Hooper Shannon K Trust,,43670 Carmel Cir,Palm Desert,CA,31021 20th Ave S,Federal Way,WA,98003
25,421049032,Midway Samoan Assembly,Midway Samoan Assembly,,29276 Military Rd S,Federal Way,WA,29414 Military Rd S,Federal Way,WA,98003
29,7203000461,Mountain Niso LLC,Mountain Niso LLC,,PO Box 3482,Redmond,WA,28430 14th Ave S,Federal Way,WA,98003
34,4045700675,Orcas Homes LLC,Orcas Homes LLC,,12411 NE 80th Way,Kirkland,WA,3412 S 360th St,Auburn,WA,98001
35,5066400035,Overcomer Covenant Church,Overcomer Covenant Church,,33415 Military Rd S,Auburn,WA,33607 Military Rd S,Auburn,WA,98001
36,5066400120,Overcomer Covenant Church,Overcomer Covenant Church,,33415 Military Rd,Auburn,WA,4406 S 338th St,Auburn,WA,98001
37,3751604107,People Infra LLC,People Infra LLC,,4012 164th Ct NE,Redmond,WA,4200 S 360th St,Auburn,WA,98001
39,5151600415,Powell Rental Co,Powell Rental Co,,PO Box 66708,Burien,WA,1103 S 299th Pl,Federal Way,WA,98003


In [73]:
# Boolean row mask: True when any name field matches an entity keyword (or is
# missing, via na=True), or when first_name / last_name is shorter than two
# characters.
mask = (
    mapped_cols["full_name"].str.contains(ENTITY_NAMES, na=True, regex=True)
    | mapped_cols["first_name"].str.contains(ENTITY_NAMES, na=True, regex=True)
    | mapped_cols["last_name"].str.contains(ENTITY_NAMES, na=True, regex=True)
    | mapped_cols["first_name"].str.len().lt(2)
    | mapped_cols["last_name"].str.len().lt(2)
)

In [74]:
# Split the mapped rows on the mask: flagged rows go to `incomplete`, the
# remaining rows go to `complete`.
incomplete = mapped_cols.loc[mask]
complete = mapped_cols.loc[~mask]

In [76]:
# Display the rows that were not flagged by the mask.
complete

Unnamed: 0,parcel,full_name,last_name,first_name,mail_add,mail_city,maill_state,prop_add,prop_city,prop_state,prop_zip
0,4045700220,Bonnie Anderson,Anderson,Bonnie,2210 Thea Ct,Milton,WA,35241 34th Ave S,Auburn,WA,98001
1,8856000493,Donald Anderson,Anderson,Donald,7348 25th Ave NW,Seattle,WA,308 1st Ave,Algona,WA,98001
2,6928600480,Timothy Berge,Berge,Timothy,624 SW 179th Place,Normandy Park,WA,30020 3rd Ave S,Federal Way,WA,98003
3,3751603633,Gregory Brock,Brock,Gregory,35919 53rd Av S,Auburn,WA,35848 54th Pl S,Auburn,WA,98001
4,221049095,Ross Brody,Brody,Ross,6542 21st Ave SW,Seattle,WA,29402 51st Ave S,Auburn,WA,98001
5,3356402380,Donna Brown,Brown,Donna,19637 Military Rd S,Seattle,WA,216 8th Ave N,Algona,WA,98001
6,1521049032,David Carpenter,Carpenter,David,13819 Military Rd E,Puyallup,WA,32734 39th Ave S,Federal Way,WA,98001
8,302000510,Christopher Defrang,Defrang,Christopher,1508 19th Ave,Longview,WA,5560 S 316th St,Auburn,WA,98001
10,1311600690,Joseph Fagg,Fagg,Joseph,PO Box 98752,Seattle,WA,3925 S 293rd St,Auburn,WA,98001
11,7263200020,Bradley Gehring,Gehring,Bradley,PO Box 972,Seahurst,WA,29929 Military Rd,Federal Way,WA,98003


In [77]:
# Write both partitions next to the source export. The DataFrame index is
# written as the first column because to_csv is called with its default
# index setting.
complete.to_csv(path_or_buf=f"./data/{filename}/clean.csv")
incomplete.to_csv(path_or_buf=f"./data/{filename}/incomplete.csv")