# Clean Covid-19 Data

In [None]:
import pandas as pd
import numpy as np

In [None]:
# source: https://health.google.com/covid-19/open-data/explorer?loc=US_KY_21111
# Load the downloaded CSV export into a DataFrame and print a summary of its
# columns, dtypes and non-null counts.
raw_csv_path = 'assets/US_KY_21111.csv'
df = pd.read_csv(raw_csv_path)
df.info()

In [None]:
# Convert the column Index to a plain Python list so the notebook prints every
# column name; the default Index repr is truncated.
df.columns.tolist()


In [None]:
# Columns to remove from the raw data, grouped by theme. The groups are joined
# in the order below to form the final `dropped_columns` list.

# Location identifiers, codes and geography.
_location_columns = [
    'location_key',
    'place_id',
    'wikidata_id',
    'datacommons_id',
    'country_code',
    'country_name',
    'subregion1_code',
    'subregion2_code',
    'iso_3166_1_alpha_2',
    'iso_3166_1_alpha_3',
    'aggregation_level',
    'openstreetmap_id',
    'latitude',
    'longitude',
    'area_sq_km',
]

# Mobility columns.
_mobility_columns = [
    'mobility_retail_and_recreation',
    'mobility_grocery_and_pharmacy',
    'mobility_parks',
    'mobility_transit_stations',
    'mobility_workplaces',
    'mobility_residential',
]

# Search-trend columns, one per symptom or condition.
_search_trend_columns = [
    'search_trends_abdominal_obesity',
    'search_trends_abdominal_pain',
    'search_trends_acne',
    'search_trends_actinic_keratosis',
    'search_trends_acute_bronchitis',
    'search_trends_adrenal_crisis',
    'search_trends_ageusia',
    'search_trends_alcoholism',
    'search_trends_allergy',
    'search_trends_amblyopia',
    'search_trends_amenorrhea',
    'search_trends_amnesia',
    'search_trends_anal_fissure',
    'search_trends_anaphylaxis',
    'search_trends_anemia',
    'search_trends_angina_pectoris',
    'search_trends_angioedema',
    'search_trends_anosmia',
    'search_trends_anxiety',
    'search_trends_aphasia',
    'search_trends_apnea',
    'search_trends_arthralgia',
    'search_trends_arthritis',
    'search_trends_ascites',
    'search_trends_asperger_syndrome',
    'search_trends_asphyxia',
    'search_trends_asthma',
    'search_trends_astigmatism',
    'search_trends_ataxia',
    'search_trends_atheroma',
    'search_trends_attention_deficit_hyperactivity_disorder',
    'search_trends_autoimmune_disease',
    'search_trends_avoidant_personality_disorder',
    'search_trends_back_pain',
    'search_trends_bacterial_vaginosis',
    'search_trends_balance_disorder',
    'search_trends_beaus_lines',
    'search_trends_bells_palsy',
    'search_trends_biliary_colic',
    'search_trends_binge_eating',
    'search_trends_bleeding',
    'search_trends_bleeding_on_probing',
    'search_trends_blepharospasm',
    'search_trends_bloating',
    'search_trends_blood_in_stool',
    'search_trends_blurred_vision',
    'search_trends_blushing',
    'search_trends_boil',
    'search_trends_bone_fracture',
    'search_trends_bone_tumor',
    'search_trends_bowel_obstruction',
    'search_trends_bradycardia',
    'search_trends_braxton_hicks_contractions',
    'search_trends_breakthrough_bleeding',
    'search_trends_breast_pain',
    'search_trends_bronchitis',
    'search_trends_bruise',
    'search_trends_bruxism',
    'search_trends_bunion',
    'search_trends_burn',
    'search_trends_burning_mouth_syndrome',
    'search_trends_candidiasis',
    'search_trends_canker_sore',
    'search_trends_cardiac_arrest',
    'search_trends_carpal_tunnel_syndrome',
    'search_trends_cataplexy',
    'search_trends_cataract',
    'search_trends_chancre',
    'search_trends_cheilitis',
    'search_trends_chest_pain',
    'search_trends_chills',
    'search_trends_chorea',
    'search_trends_chronic_pain',
    'search_trends_cirrhosis',
    'search_trends_cleft_lip_and_cleft_palate',
    'search_trends_clouding_of_consciousness',
    'search_trends_cluster_headache',
    'search_trends_colitis',
    'search_trends_coma',
    'search_trends_common_cold',
    'search_trends_compulsive_behavior',
    'search_trends_compulsive_hoarding',
    'search_trends_confusion',
    'search_trends_congenital_heart_defect',
    'search_trends_conjunctivitis',
    'search_trends_constipation',
    'search_trends_convulsion',
    'search_trends_cough',
    'search_trends_cramp',
    'search_trends_crepitus',
    'search_trends_croup',
    'search_trends_cyanosis',
    'search_trends_dandruff',
    'search_trends_delayed_onset_muscle_soreness',
    'search_trends_dementia',
    'search_trends_dentin_hypersensitivity',
    'search_trends_depersonalization',
    'search_trends_depression',
    'search_trends_dermatitis',
    'search_trends_desquamation',
    'search_trends_developmental_disability',
    'search_trends_diabetes',
    'search_trends_diabetic_ketoacidosis',
    'search_trends_diarrhea',
    'search_trends_dizziness',
    'search_trends_dry_eye_syndrome',
    'search_trends_dysgeusia',
    'search_trends_dysmenorrhea',
    'search_trends_dyspareunia',
    'search_trends_dysphagia',
    'search_trends_dysphoria',
    'search_trends_dystonia',
    'search_trends_dysuria',
    'search_trends_ear_pain',
    'search_trends_eczema',
    'search_trends_edema',
    'search_trends_encephalitis',
    'search_trends_encephalopathy',
    'search_trends_epidermoid_cyst',
    'search_trends_epilepsy',
    'search_trends_epiphora',
    'search_trends_erectile_dysfunction',
    'search_trends_erythema',
    'search_trends_erythema_chronicum_migrans',
    'search_trends_esophagitis',
    'search_trends_excessive_daytime_sleepiness',
    'search_trends_eye_pain',
    'search_trends_eye_strain',
    'search_trends_facial_nerve_paralysis',
    'search_trends_facial_swelling',
    'search_trends_fasciculation',
    'search_trends_fatigue',
    'search_trends_fatty_liver_disease',
    'search_trends_fecal_incontinence',
    'search_trends_fever',
    'search_trends_fibrillation',
    'search_trends_fibrocystic_breast_changes',
    'search_trends_fibromyalgia',
    'search_trends_flatulence',
    'search_trends_floater',
    'search_trends_focal_seizure',
    'search_trends_folate_deficiency',
    'search_trends_food_craving',
    'search_trends_food_intolerance',
    'search_trends_frequent_urination',
    'search_trends_gastroesophageal_reflux_disease',
    'search_trends_gastroparesis',
    'search_trends_generalized_anxiety_disorder',
    'search_trends_genital_wart',
    'search_trends_gingival_recession',
    'search_trends_gingivitis',
    'search_trends_globus_pharyngis',
    'search_trends_goitre',
    'search_trends_gout',
    'search_trends_grandiosity',
    'search_trends_granuloma',
    'search_trends_guilt',
    'search_trends_hair_loss',
    'search_trends_halitosis',
    'search_trends_hay_fever',
    'search_trends_headache',
    'search_trends_heart_arrhythmia',
    'search_trends_heart_murmur',
    'search_trends_heartburn',
    'search_trends_hematochezia',
    'search_trends_hematoma',
    'search_trends_hematuria',
    'search_trends_hemoptysis',
    'search_trends_hemorrhoids',
    'search_trends_hepatitis',
    'search_trends_hepatotoxicity',
    'search_trends_hiccup',
    'search_trends_hip_pain',
    'search_trends_hives',
    'search_trends_hot_flash',
    'search_trends_hydrocephalus',
    'search_trends_hypercalcaemia',
    'search_trends_hypercholesterolemia',
    'search_trends_hyperemesis_gravidarum',
    'search_trends_hyperglycemia',
    'search_trends_hyperhidrosis',
    'search_trends_hyperkalemia',
    'search_trends_hyperlipidemia',
    'search_trends_hypermobility',
    'search_trends_hyperpigmentation',
    'search_trends_hypersomnia',
    'search_trends_hypertension',
    'search_trends_hyperthermia',
    'search_trends_hyperthyroidism',
    'search_trends_hypertriglyceridemia',
    'search_trends_hypertrophy',
    'search_trends_hyperventilation',
    'search_trends_hypocalcaemia',
    'search_trends_hypochondriasis',
    'search_trends_hypoglycemia',
    'search_trends_hypogonadism',
    'search_trends_hypokalemia',
    'search_trends_hypomania',
    'search_trends_hyponatremia',
    'search_trends_hypotension',
    'search_trends_hypothyroidism',
    'search_trends_hypoxemia',
    'search_trends_hypoxia',
    'search_trends_impetigo',
    'search_trends_implantation_bleeding',
    'search_trends_impulsivity',
    'search_trends_indigestion',
    'search_trends_infection',
    'search_trends_inflammation',
    'search_trends_inflammatory_bowel_disease',
    'search_trends_ingrown_hair',
    'search_trends_insomnia',
    'search_trends_insulin_resistance',
    'search_trends_intermenstrual_bleeding',
    'search_trends_intracranial_pressure',
    'search_trends_iron_deficiency',
    'search_trends_irregular_menstruation',
    'search_trends_itch',
    'search_trends_jaundice',
    'search_trends_kidney_failure',
    'search_trends_kidney_stone',
    'search_trends_knee_pain',
    'search_trends_kyphosis',
    'search_trends_lactose_intolerance',
    'search_trends_leg_cramps',
    'search_trends_lesion',
    'search_trends_leukorrhea',
    'search_trends_lightheadedness',
    'search_trends_low_back_pain',
    'search_trends_low_grade_fever',
    'search_trends_lymphedema',
    'search_trends_major_depressive_disorder',
    'search_trends_malabsorption',
    'search_trends_male_infertility',
    'search_trends_manic_disorder',
    'search_trends_melasma',
    'search_trends_melena',
    'search_trends_meningitis',
    'search_trends_menorrhagia',
    'search_trends_middle_back_pain',
    'search_trends_migraine',
    'search_trends_milium',
    'search_trends_mitral_insufficiency',
    'search_trends_mood_disorder',
    'search_trends_mood_swing',
    'search_trends_morning_sickness',
    'search_trends_motion_sickness',
    'search_trends_mouth_ulcer',
    'search_trends_muscle_atrophy',
    'search_trends_muscle_weakness',
    'search_trends_myalgia',
    'search_trends_mydriasis',
    'search_trends_myocardial_infarction',
    'search_trends_nasal_congestion',
    'search_trends_nausea',
    'search_trends_neck_mass',
    'search_trends_neck_pain',
    'search_trends_neonatal_jaundice',
    'search_trends_nerve_injury',
    'search_trends_neuralgia',
    'search_trends_neutropenia',
    'search_trends_night_sweats',
    'search_trends_night_terror',
    'search_trends_nocturnal_enuresis',
    'search_trends_nodule',
    'search_trends_nosebleed',
    'search_trends_nystagmus',
    'search_trends_obesity',
    'search_trends_onychorrhexis',
    'search_trends_oral_candidiasis',
    'search_trends_orthostatic_hypotension',
    'search_trends_osteopenia',
    'search_trends_osteophyte',
    'search_trends_osteoporosis',
    'search_trends_otitis',
    'search_trends_otitis_externa',
    'search_trends_otitis_media',
    'search_trends_pain',
    'search_trends_palpitations',
    'search_trends_pancreatitis',
    'search_trends_panic_attack',
    'search_trends_papule',
    'search_trends_paranoia',
    'search_trends_paresthesia',
    'search_trends_pelvic_inflammatory_disease',
    'search_trends_pericarditis',
    'search_trends_periodontal_disease',
    'search_trends_periorbital_puffiness',
    'search_trends_peripheral_neuropathy',
    'search_trends_perspiration',
    'search_trends_petechia',
    'search_trends_phlegm',
    'search_trends_photophobia',
    'search_trends_photopsia',
    'search_trends_pleural_effusion',
    'search_trends_pleurisy',
    'search_trends_pneumonia',
    'search_trends_podalgia',
    'search_trends_polycythemia',
    'search_trends_polyneuropathy',
    'search_trends_polyuria',
    'search_trends_poor_posture',
    'search_trends_post_nasal_drip',
    'search_trends_postural_orthostatic_tachycardia_syndrome',
    'search_trends_prediabetes',
    'search_trends_proteinuria',
    'search_trends_pruritus_ani',
    'search_trends_psychosis',
    'search_trends_ptosis',
    'search_trends_pulmonary_edema',
    'search_trends_pulmonary_hypertension',
    'search_trends_purpura',
    'search_trends_pus',
    'search_trends_pyelonephritis',
    'search_trends_radiculopathy',
    'search_trends_rectal_prolapse',
    'search_trends_red_eye',
    'search_trends_renal_colic',
    'search_trends_restless_legs_syndrome',
    'search_trends_rheum',
    'search_trends_rhinitis',
    'search_trends_rhinorrhea',
    'search_trends_rosacea',
    'search_trends_round_ligament_pain',
    'search_trends_rumination',
    'search_trends_scar',
    'search_trends_sciatica',
    'search_trends_scoliosis',
    'search_trends_seborrheic_dermatitis',
    'search_trends_self_harm',
    'search_trends_sensitivity_to_sound',
    'search_trends_sexual_dysfunction',
    'search_trends_sharp_pain',
    'search_trends_shivering',
    'search_trends_shortness_of_breath',
    'search_trends_shyness',
    'search_trends_sinusitis',
    'search_trends_skin_condition',
    'search_trends_skin_rash',
    'search_trends_skin_tag',
    'search_trends_skin_ulcer',
    'search_trends_sleep_apnea',
    'search_trends_sleep_deprivation',
    'search_trends_sleep_disorder',
    'search_trends_snoring',
    'search_trends_sore_throat',
    'search_trends_spasticity',
    'search_trends_splenomegaly',
    'search_trends_sputum',
    'search_trends_stomach_rumble',
    'search_trends_strabismus',
    'search_trends_stretch_marks',
    'search_trends_stroke',
    'search_trends_stuttering',
    'search_trends_subdural_hematoma',
    'search_trends_suicidal_ideation',
    'search_trends_swelling',
    'search_trends_swollen_feet',
    'search_trends_swollen_lymph_nodes',
    'search_trends_syncope',
    'search_trends_tachycardia',
    'search_trends_tachypnea',
    'search_trends_telangiectasia',
    'search_trends_tenderness',
    'search_trends_testicular_pain',
    'search_trends_throat_irritation',
    'search_trends_thrombocytopenia',
    'search_trends_thyroid_nodule',
    'search_trends_tic',
    'search_trends_tinnitus',
    'search_trends_tonsillitis',
    'search_trends_toothache',
    'search_trends_tremor',
    'search_trends_trichoptilosis',
    'search_trends_tumor',
    'search_trends_type_2_diabetes',
    'search_trends_unconsciousness',
    'search_trends_underweight',
    'search_trends_upper_respiratory_tract_infection',
    'search_trends_urethritis',
    'search_trends_urinary_incontinence',
    'search_trends_urinary_tract_infection',
    'search_trends_uterine_contraction',
    'search_trends_vaginal_bleeding',
    'search_trends_vaginal_discharge',
    'search_trends_vaginitis',
    'search_trends_varicose_veins',
    'search_trends_vasculitis',
    'search_trends_ventricular_tachycardia',
    'search_trends_vertigo',
    'search_trends_visual_acuity',
    'search_trends_vomiting',
    'search_trends_wart',
    'search_trends_water_retention',
    'search_trends_weakness',
    'search_trends_weight_gain',
    'search_trends_wheeze',
    'search_trends_xeroderma',
    'search_trends_xerostomia',
    'search_trends_yawn',
]

# Weather columns.
_weather_columns = [
    'average_temperature_celsius',
    'minimum_temperature_celsius',
    'maximum_temperature_celsius',
    'rainfall_mm',
    'snowfall_mm',
    'dew_point',
    'relative_humidity',
]

# Full list of columns to drop, in the same order as the groups above.
dropped_columns = [
    *_location_columns,
    *_mobility_columns,
    *_search_trend_columns,
    *_weather_columns,
]

In [None]:
# Remove every column named in dropped_columns, modifying df in place.
df.drop(labels=dropped_columns, axis='columns', inplace=True)

In [None]:
# Print the DataFrame summary again to check which columns remain.
df.info()

In [None]:
# Give the region and population columns more descriptive names (in place).
clearer_names = {
    'subregion1_name': 'state',
    'subregion2_name': 'county',
    'population': 'total_population',
}
df.rename(columns=clearer_names, inplace=True)

In [None]:
# Preview the first three rows.
df.head(3)

In [None]:
# Parse the date column as datetimes, then store each value as a
# "<full month name> <year>" string via the '%B %Y' format.
# Note: after this step the column holds strings, not datetimes.
parsed_dates = pd.to_datetime(df['date'])
df['date'] = parsed_dates.dt.strftime('%B %Y')

In [None]:
# Display the DataFrame as the cell output.
df

In [None]:
# The population figures show no change across the data set, so those columns
# (along with life_expectancy) are dropped as well.
static_columns = [
    'total_population',
    'population_male',
    'population_female',
    'population_age_00_09',
    'population_age_10_19',
    'population_age_20_29',
    'population_age_30_39',
    'population_age_40_49',
    'population_age_50_59',
    'population_age_60_69',
    'population_age_70_79',
    'population_age_80_and_older',
    'life_expectancy',
]
df = df.drop(columns=static_columns)
df.info()