# White House visitor logs

### Import Python tools and Jupyter configuration

In [1]:
%load_ext lab_black

In [2]:
import pandas as pd
import datetime as dt
import altair as alt
import numpy as np

In [3]:
# Turn off Altair's max-rows check before any charts are built.
alt.data_transformers.disable_max_rows()
# Let pandas render up to 1000 columns/rows and never truncate cell contents.
pd.set_option("display.max_columns", 1000)
pd.set_option("display.max_rows", 1000)
pd.set_option("display.max_colwidth", None)

### Data dictionary

In [4]:
# "https://obamawhitehouse.archives.gov/files/disclosures/visitors/WhiteHouse-WAVES-Key-1209.txt"

In [5]:
# Today's date as an MM-DD-YYYY string.
today = f"{dt.date.today():%m-%d-%Y}"

In [6]:
# Load the processed visitor log; the appointment and release timestamp
# columns are converted to datetimes while reading.
df = pd.read_csv(
    filepath_or_buffer="data/processed/log_latest.csv",
    parse_dates=[
        "appt_made_date",
        "appt_start_date",
        "appt_end_date",
        "appt_cancel_date",
        "releasedate",
    ],
)

In [7]:
# Preview the five rows with the most recent appointment-made timestamps.
df.sort_values(by="appt_made_date", ascending=False).head(5)

Unnamed: 0,namelast,namefirst,namemid,uin,bdgnbr,access_type,toa,poa,tod,pod,appt_made_date,appt_start_date,appt_end_date,appt_cancel_date,total_people,last_updatedby,post,lastentrydate,terminal_suffix,visitee_namelast,visitee_namefirst,meeting_loc,meeting_room,caller_name_last,caller_name_first,caller_room,releasedate,description
4868,HARKINS,CHRISTINE,P,U36027,,VA,NAN,NAN,NAN,NAN,2021-11-30 11:57:00,2021-11-30 14:00:00,2021-11-30 23:59:00,NaT,1.0,DN,WIN,11/30/2021 11:57,DN,NELSON,DAVID,VPR,VPR,NELSON,DAVID,,2022-03-11,NAN
7944,PETERS,KATIE,J,U36004,,VA,NAN,NAN,NAN,NAN,2021-11-30 09:26:00,2021-11-30 12:00:00,2021-11-30 23:59:00,NaT,5.0,KG,WIN,11/30/2021 9:26,KG,NAN,PLAYMAKER,VPR,RESIDENCE,GOODHUE,KEVIN,,2022-03-11,NAN
7943,JAVAID,ZAINA,N,U36004,,VA,NAN,NAN,NAN,NAN,2021-11-30 09:26:00,2021-11-30 12:00:00,2021-11-30 23:59:00,NaT,5.0,KG,WIN,11/30/2021 9:26,KG,NAN,PLAYMAKER,VPR,RESIDENCE,GOODHUE,KEVIN,,2022-03-11,NAN
7942,CREWS,ARLENE,N,U36004,,VA,NAN,NAN,NAN,NAN,2021-11-30 09:26:00,2021-11-30 12:00:00,2021-11-30 23:59:00,NaT,5.0,KG,WIN,11/30/2021 9:26,KG,NAN,PLAYMAKER,VPR,RESIDENCE,GOODHUE,KEVIN,,2022-03-11,NAN
5360,SINGLA,RUKKU,N,U36004,,VA,NAN,NAN,NAN,NAN,2021-11-30 09:26:00,2021-11-30 12:00:00,2021-11-30 23:59:00,NaT,5.0,KG,WIN,11/30/2021 9:26,KG,NAN,PLAYMAKER,VPR,RESIDENCE,GOODHUE,KEVIN,,2022-03-11,NAN


### Buildings

In [8]:
# Number of log rows per building code.
df["meeting_loc"].value_counts()

OEOB    12255
WH      10483
NEOB     1255
VPR      1102
EEOB      837
NAN       737
Name: meeting_loc, dtype: int64

### Rooms 

In [9]:
# Five most frequent meeting rooms.
df["meeting_room"].value_counts().head(5)

SOUTH LAWN    1976
RES - STAT    1479
EW206         1220
445           1063
374           1011
Name: meeting_room, dtype: int64

### Who's visited the Oval?

In [10]:
# Count rows whose meeting room contains the text "OVAL" (substring match, so
# both "OVAL" and "OVAL OFFIC" are included).
# na=False makes rows with a missing room evaluate to False rather than NaN,
# which would otherwise make the boolean mask invalid; regex=False matches the
# text literally.
len(df[df["meeting_room"].str.contains("OVAL", na=False, regex=False)])

478

In [11]:
# Preview rows whose meeting room contains the text "OVAL" (substring match).
# na=False keeps rows with a missing room out of the mask instead of producing
# NaN entries that break boolean indexing; regex=False matches literally.
df[df["meeting_room"].str.contains("OVAL", na=False, regex=False)].head()

Unnamed: 0,namelast,namefirst,namemid,uin,bdgnbr,access_type,toa,poa,tod,pod,appt_made_date,appt_start_date,appt_end_date,appt_cancel_date,total_people,last_updatedby,post,lastentrydate,terminal_suffix,visitee_namelast,visitee_namefirst,meeting_loc,meeting_room,caller_name_last,caller_name_first,caller_room,releasedate,description
170,FAUVRE,LEO,B,U24904,,VA,5/14/2021 10:47,B0401,NAN,NAN,2021-05-13 10:33:00,2021-05-14 10:30:00,2021-05-14 23:59:00,NaT,4.0,PS,WIN,5/13/2021 10:33,PS,NAN,POTUS,WH,OVAL OFFIC,SINGH,PRIYA,,2021-08-30,NAN
181,SMITH,GAYLE,E,U24948,,VA,NAN,NAN,NAN,NAN,2021-05-14 07:02:00,2021-05-14 12:45:00,2021-05-14 23:59:00,NaT,1.0,AW,WIN,5/14/2021 7:02,AW,NAN,POTUS,WH,OVAL,WITHERS,ANNE,,2021-08-30,NAN
185,LATTHIVONGSKORN,JIRAYUT,N,U24901,179726.0,VA,5/14/2021 13:24,B0401,5/14/2021 17:20,A05,2021-05-13 09:05:00,2021-05-14 13:00:00,2021-05-14 23:59:00,NaT,7.0,NS,WIN,5/13/2021 9:05,NS,NAN,POTUS,WH,OVAL OFFIC,SILVA,NEZLY,,2021-08-30,NAN
189,PRAELIANGULO,MARIA,N,U24901,178274.0,VA,5/14/2021 13:21,B0401,5/14/2021 17:20,A05,2021-05-13 09:05:00,2021-05-14 13:00:00,2021-05-14 23:59:00,NaT,7.0,NS,WIN,5/13/2021 9:05,NS,NAN,POTUS,WH,OVAL OFFIC,SILVA,NEZLY,,2021-08-30,NAN
190,RANGELPEREZ,LEYDY,M,U24901,178054.0,VA,5/14/2021 13:21,B0401,NAN,NAN,2021-05-13 09:05:00,2021-05-14 13:00:00,2021-05-14 23:59:00,NaT,7.0,NS,WIN,5/13/2021 9:05,NS,NAN,POTUS,WH,OVAL OFFIC,SILVA,NEZLY,,2021-08-30,NAN


### Where meeting room is ...

In [12]:
# Preview rows whose meeting room contains the text "EW206".
# na=False keeps rows with a missing room out of the mask instead of producing
# NaN entries that break boolean indexing; regex=False matches literally.
df[df["meeting_room"].str.contains("EW206", na=False, regex=False)].head()

Unnamed: 0,namelast,namefirst,namemid,uin,bdgnbr,access_type,toa,poa,tod,pod,appt_made_date,appt_start_date,appt_end_date,appt_cancel_date,total_people,last_updatedby,post,lastentrydate,terminal_suffix,visitee_namelast,visitee_namefirst,meeting_loc,meeting_room,caller_name_last,caller_name_first,caller_room,releasedate,description
338,MACKALL,LEE,A,U25238,,VA,NAN,NAN,NAN,NAN,2021-05-20 13:00:00,2021-05-21 10:00:00,2021-05-21 23:59:00,NaT,31.0,DV,WIN,5/20/2021 13:00,DV,NAN,POTUS,WH,EW206,VIA,DANIEL,,2021-08-30,NAN
339,MAHONEY,ROBERT,P,U25238,,VA,NAN,NAN,NAN,NAN,2021-05-20 13:00:00,2021-05-21 10:00:00,2021-05-21 23:59:00,NaT,31.0,DV,WIN,5/20/2021 13:00,DV,NAN,POTUS,WH,EW206,VIA,DANIEL,,2021-08-30,NAN
340,MASLINE,XAVIERA,J,U25238,,VA,NAN,NAN,NAN,NAN,2021-05-20 09:06:00,2021-05-21 10:00:00,2021-05-21 23:59:00,NaT,31.0,DV,WIN,5/20/2021 9:06,DV,NAN,POTUS,WH,EW206,VIA,DANIEL,,2021-08-30,NAN
341,MAXON,ERIC,D,U25238,,VA,NAN,NAN,NAN,NAN,2021-05-20 09:06:00,2021-05-21 10:00:00,2021-05-21 23:59:00,NaT,31.0,DV,WIN,5/20/2021 9:06,DV,NAN,POTUS,WH,EW206,VIA,DANIEL,,2021-08-30,NAN
343,ORTMAN,JUSTIN,D,U25238,,VA,NAN,NAN,NAN,NAN,2021-05-20 09:06:00,2021-05-21 10:00:00,2021-05-21 23:59:00,NaT,31.0,DV,WIN,5/20/2021 9:06,DV,NAN,POTUS,WH,EW206,VIA,DANIEL,,2021-08-30,NAN


### Where 'visitee' is explicity the Vice President

In [13]:
# Count rows whose visitee first-name field contains the text "VPOTUS".
# na=False makes rows with a missing visitee name evaluate to False rather than
# NaN, which would otherwise make the boolean mask invalid; regex=False matches
# the text literally.
len(df[df["visitee_namefirst"].str.contains("VPOTUS", na=False, regex=False)])

131

In [14]:
# Write the rows whose visitee first-name field contains "VPOTUS" to CSV,
# without the DataFrame index.
# na=False keeps rows with a missing visitee name out of the mask instead of
# producing NaN entries that break boolean indexing; regex=False matches
# the text literally.
df[df["visitee_namefirst"].str.contains("VPOTUS", na=False, regex=False)].to_csv(
    "data/processed/vpotus_visitee.csv", index=False
)