In [52]:
import pandas as pd

# Load the raw intake and outcome exports (paths are relative to the notebook's working directory).
intakes_df = pd.read_csv('Austin_Animal_Center_Intakes.csv')
outcomes_df = pd.read_csv('Austin_Animal_Center_Outcomes.csv')

# Baseline: how many distinct animals appear in each raw file.
print("Unique Animal IDs in Intakes before filtering:", intakes_df['Animal ID'].nunique())
print("Unique Animal IDs in Outcomes before filtering:", outcomes_df['Animal ID'].nunique())

# Keep only the first row encountered for each animal, then key each table by 'Animal ID'
# so the two tables can be joined on their indexes.
# NOTE(review): if an animal has several visits, only its first row in file order survives,
# and the first intake row is not guaranteed to describe the same visit as the first
# outcome row — confirm this is the intended pairing.
intakes_df = intakes_df.drop_duplicates(subset='Animal ID').set_index('Animal ID')
outcomes_df = outcomes_df.drop_duplicates(subset='Animal ID').set_index('Animal ID')

# Distinct animals after de-duplication.
# NOTE(review): dropping duplicates on 'Animal ID' cannot change the number of distinct IDs,
# so these figures always equal the "before" figures; comparing row counts would be the
# informative check.
print("Unique Animal IDs in Intakes after filtering:", intakes_df.index.nunique())
print("Unique Animal IDs in Outcomes after filtering:", outcomes_df.index.nunique())

# Inner join on the shared index: only animals present in BOTH tables are kept.
# Column names that occur in both tables get the '_intakes' / '_outcomes' suffixes.
# The trailing reset_index() turns 'Animal ID' back into an ordinary column.
result_df = (
    intakes_df
    .join(outcomes_df, how='inner', lsuffix='_intakes', rsuffix='_outcomes')
    .reset_index()
)

# Distinct animals that survived the join.
print("Unique Animal IDs in Result:", result_df['Animal ID'].nunique())


Unique Animal IDs in Intakes before filtering: 58552
Unique Animal IDs in Outcomes before filtering: 29044
Unique Animal IDs in Intakes after filtering: 58552
Unique Animal IDs in Outcomes after filtering: 29044
Unique Animal IDs in Result: 28745


In [53]:
# Size of the de-duplicated intake table as (rows, columns).
# 'Animal ID' is the index at this point, so it is not counted among the columns.
intakes_df.shape

(58552, 11)

In [54]:
# Size of the de-duplicated outcome table as (rows, columns).
# 'Animal ID' is the index at this point, so it is not counted among the columns.
outcomes_df.shape

(29044, 11)

In [55]:
# Size of the joined table as (rows, columns).
# The index was reset after the join, so 'Animal ID' is counted as a regular column here.
result_df.shape

(28745, 23)

In [56]:
# Count rows that exactly repeat an earlier row across every column; 0 means no full-row duplicates.
result_df.duplicated().sum()

0

In [57]:
# Preview the first rows of the joined table to eyeball the suffixed intake/outcome columns.
result_df.head()

Unnamed: 0,Animal ID,Name_intakes,DateTime_intakes,MonthYear_intakes,Found Location,Intake Type,Intake Condition,Animal Type_intakes,Sex upon Intake,Age upon Intake,...,DateTime_outcomes,MonthYear_outcomes,Date of Birth,Outcome Type,Outcome Subtype,Animal Type_outcomes,Sex upon Outcome,Age upon Outcome,Breed_outcomes,Color_outcomes
0,A664887,*Gia,10/10/2013 01:48:00 PM,October 2013,1901 Onion Creek Pkwy in Austin (TX),Stray,Normal,Cat,Intact Female,1 month,...,11/10/2013 04:56:00 PM,Nov 2013,08/10/2013,Adoption,,Cat,Spayed Female,3 months,Domestic Shorthair Mix,Black
1,A665496,Mikey,10/18/2013 06:07:00 PM,October 2013,12001 Metric Blvd in Austin (TX),Stray,Normal,Cat,Neutered Male,3 years,...,10/22/2013 05:54:00 PM,Oct 2013,04/18/2010,Adoption,,Cat,Neutered Male,3 years,Bengal,Brown Tiger
2,A664936,*Jester,10/11/2013 11:20:00 AM,October 2013,501 U.S. 183 in Austin (TX),Stray,Normal,Cat,Intact Male,1 month,...,12/18/2013 06:18:00 PM,Dec 2013,08/18/2013,Adoption,,Cat,Neutered Male,4 months,Domestic Medium Hair Mix,Brown Tabby
3,A665398,Haven,10/17/2013 12:26:00 PM,October 2013,Austin (TX),Owner Surrender,Normal,Cat,Intact Female,1 month,...,11/10/2013 04:45:00 PM,Nov 2013,08/19/2013,Adoption,,Cat,Spayed Female,2 months,Domestic Shorthair Mix,White/Blue
4,A665426,Silka,10/17/2013 04:53:00 PM,October 2013,8224 Research Blvd #244 in Austin (TX),Stray,Normal,Cat,Intact Male,1 month,...,11/16/2013 05:09:00 PM,Nov 2013,08/26/2013,Adoption,,Cat,Neutered Male,2 months,Domestic Shorthair Mix,Black


In [58]:

# Export the joined table to CSV. index=False leaves the row index out of the file.
# NOTE(review): assumes the ../dataset directory already exists relative to the working
# directory; the input files above are read from the working directory itself — confirm
# the layout.
result_df.to_csv("../dataset/Texas_Intake_and_Outcome.csv", index = False)

In [59]:
# Same full-row duplicate count as the earlier check, repeated after the export.
# No visible cell reassigns result_df between the two checks.
result_df.duplicated().sum()

0

In [60]:
# Read the exported CSV back in to confirm the file was written and parses as expected,
# then display its first 50 rows.
reading = pd.read_csv("../dataset/Texas_Intake_and_Outcome.csv")
reading.head(50)

Unnamed: 0,Animal ID,Name_intakes,DateTime_intakes,MonthYear_intakes,Found Location,Intake Type,Intake Condition,Animal Type_intakes,Sex upon Intake,Age upon Intake,...,DateTime_outcomes,MonthYear_outcomes,Date of Birth,Outcome Type,Outcome Subtype,Animal Type_outcomes,Sex upon Outcome,Age upon Outcome,Breed_outcomes,Color_outcomes
0,A664887,*Gia,10/10/2013 01:48:00 PM,October 2013,1901 Onion Creek Pkwy in Austin (TX),Stray,Normal,Cat,Intact Female,1 month,...,11/10/2013 04:56:00 PM,Nov 2013,08/10/2013,Adoption,,Cat,Spayed Female,3 months,Domestic Shorthair Mix,Black
1,A665496,Mikey,10/18/2013 06:07:00 PM,October 2013,12001 Metric Blvd in Austin (TX),Stray,Normal,Cat,Neutered Male,3 years,...,10/22/2013 05:54:00 PM,Oct 2013,04/18/2010,Adoption,,Cat,Neutered Male,3 years,Bengal,Brown Tiger
2,A664936,*Jester,10/11/2013 11:20:00 AM,October 2013,501 U.S. 183 in Austin (TX),Stray,Normal,Cat,Intact Male,1 month,...,12/18/2013 06:18:00 PM,Dec 2013,08/18/2013,Adoption,,Cat,Neutered Male,4 months,Domestic Medium Hair Mix,Brown Tabby
3,A665398,Haven,10/17/2013 12:26:00 PM,October 2013,Austin (TX),Owner Surrender,Normal,Cat,Intact Female,1 month,...,11/10/2013 04:45:00 PM,Nov 2013,08/19/2013,Adoption,,Cat,Spayed Female,2 months,Domestic Shorthair Mix,White/Blue
4,A665426,Silka,10/17/2013 04:53:00 PM,October 2013,8224 Research Blvd #244 in Austin (TX),Stray,Normal,Cat,Intact Male,1 month,...,11/16/2013 05:09:00 PM,Nov 2013,08/26/2013,Adoption,,Cat,Neutered Male,2 months,Domestic Shorthair Mix,Black
5,A666091,Willy,10/26/2013 04:43:00 PM,October 2013,5300 Pecan Brook in Austin (TX),Stray,Normal,Cat,Intact Male,1 month,...,12/06/2013 03:54:00 PM,Dec 2013,09/11/2013,Adoption,Foster,Cat,Neutered Male,2 months,Domestic Medium Hair Mix,Black/White
6,A665994,*Lihue,10/25/2013 05:41:00 PM,October 2013,N Ih 35 in Austin (TX),Stray,Normal,Cat,Intact Female,3 months,...,11/05/2013 07:22:00 PM,Nov 2013,07/25/2013,Adoption,,Cat,Spayed Female,3 months,Domestic Shorthair Mix,Calico
7,A664857,,10/10/2013 07:47:00 AM,October 2013,Old Bee Caves And Hwy 71 in Austin (TX),Stray,Normal,Cat,Intact Male,6 months,...,10/14/2013 05:34:00 PM,Oct 2013,04/10/2013,Adoption,,Cat,Neutered Male,6 months,Domestic Shorthair Mix,Black/White
8,A664754,,10/08/2013 04:46:00 PM,October 2013,Austin (TX),Owner Surrender,Normal,Cat,Intact Male,5 months,...,10/13/2013 06:03:00 PM,Oct 2013,04/23/2013,Adoption,,Cat,Neutered Male,5 months,Domestic Shorthair Mix,Black
9,A664446,*Riley,10/03/2013 01:06:00 PM,October 2013,6201 E 290 in Austin (TX),Stray,Injured,Cat,Intact Male,3 years,...,03/15/2014 03:27:00 PM,Mar 2014,10/03/2010,Adoption,Foster,Cat,Neutered Male,3 years,Domestic Shorthair Mix,Orange Tabby
