# Challenge NabuMinds - Thiago Sequeira

## Data Cleaning & Preparation for Visualization

In [51]:
import pandas as pd
import numpy as np

### Dictionaries

In [52]:
# Lookup table from the raw `user_timezone` value to a country/region label.
# Keys are matched exactly (case- and punctuation-sensitive) by Series.map,
# which is why both 'La Paz' and 'La Paz.' are listed.
# Labels follow the same vocabulary as tweet_location_dic (e.g. 'America',
# 'UK') because both mappings are merged into a single column downstream.
user_timezone_dic = {
    'Eastern Time (US & Canada)': 'America',
    'Pacific Time (US & Canada)': 'America',
    'Central Time (US & Canada)': 'America',
    'La Paz': 'Bolivia',
    'America/New_York': 'America',
    'Atlantic Time (Canada)': 'Canada',
    'Quito': 'Ecuador',
    'Mountain Time (US & Canada)': 'America',
    'Vienna': 'Austria',
    'Caracas': 'Venezuela',
    'Kuala Lumpur': 'Malaysia',
    'Brisbane': 'Australia',
    'Arizona': 'America',
    # 'UK' (not 'United Kingdom') so it agrees with tweet_location_dic.
    'London': 'UK',
    'Tehran': 'Iran',
    'Alaska': 'America',
    'Sydney': 'Australia',
    'Irkutsk': 'Russia',
    'Santiago': 'Chile',
    'Amsterdam': 'Netherlands',
    'Tijuana': 'Mexico',
    'Abu Dhabi': 'United Arab Emirates',
    'Central America': 'Central America',
    'Edinburgh': 'UK',
    'Jerusalem': 'Israel',
    'Hawaii': 'America',
    'Paris': 'France',
    'Guam': 'Guam',
    'New Delhi': 'India',
    'Stockholm': 'Sweden',
    'America/Chicago': 'America',
    'Berlin': 'Germany',
    'Madrid': 'Spain',
    'Athens': 'Greece',
    'Brussels': 'Belgium',
    'Taipei': 'Taiwan',
    'Rome': 'Italy',
    'Beijing': 'China',
    'Mexico City': 'Mexico',
    'Bern': 'Switzerland',
    'Singapore': 'Singapore',
    'Indiana (East)': 'America',
    'Melbourne': 'Australia',
    'Saskatchewan': 'Canada',
    'Casablanca': 'Morocco',
    'Brasilia': 'Brazil',
    'Kyiv': 'Ukraine',
    'Bucharest': 'Romania',
    'Greenland': 'Greenland',
    'Prague': 'Czech Republic',
    'New Caledonia': 'New Caledonia',
    'Bogota': 'Colombia',
    'Seoul': 'South Korea',
    'Sarajevo': 'Bosnia and Herzegovina',
    'Wellington': 'New Zealand',
    'Bangkok': 'Thailand',
    'Warsaw': 'Poland',
    'Copenhagen': 'Denmark',
    'Hong Kong': 'Hong Kong',
    'Guadalajara': 'Mexico',
    'Mid-Atlantic': 'Mid-Atlantic',
    'Mazatlan': 'Mexico',
    'Buenos Aires': 'Argentina',
    'America/Los_Angeles': 'America',
    'Dublin': 'Ireland',
    'Lisbon': 'Portugal',
    'Newfoundland': 'Canada',
    'Monterrey': 'Mexico',
    'Tokyo': 'Japan',
    'America/Detroit': 'America',
    'Midway Island': 'America',
    'Istanbul': 'Turkey',
    'Solomon Is.': 'Solomon Islands',
    'America/Atikokan': 'Canada',
    'Adelaide': 'Australia',
    'Nairobi': 'Kenya',
    'EST': 'America',
    'Lima': 'Peru',
    'Islamabad': 'Pakistan',
    'Helsinki': 'Finland',
    'Pretoria': 'South Africa',
    'West Central Africa': 'West Central Africa',
    'America/Boise': 'America',
    'Canberra': 'Australia',
    'Perth': 'Australia',
    'La Paz.': 'Bolivia'
}

In [53]:
# Lookup table from the free-text `tweet_location` value to a country/region
# label. Entries are written in whatever casing they were collected in; the
# comprehension at the end of this cell lower-cases every key so that the
# lookup can be done against a lower-cased column.
# Some keys appear more than once (e.g. "dc", "puerto rico"); in a dict
# literal the last occurrence of a key is the one that is kept.
# Locations that cannot be attributed to a place are labelled "Unknown".
tweet_location_dic = {
    "San Mateo, CA & Las Vegas, NV": "America",
    "Central Texas": "America",
    "brighton, uk": "UK",
    "allen, tx": "America",
    "belle mo": "America",
    "connecticut": "America",
    "long island - arizona": "America",
    "nürnberg, germany ": "Germany",
    "atlanta, ga": "America",
    "washington, dc. ": "America",
    "puerto rico": "Puerto Rico",
    "dc": "America",
    "las vegas": "America",
    "chandler, az": "America",
    "albany, ny": "America",
    "albuquerque, new mexico": "America",
    "america": "America",
    "anaheim": "America",
    "arlington, virginia": "America",
    "atlanta": "America",
    "atlanta ga": "America",
    "auburn, me": "America",
    "austin, texas": "America",
    "baltimore": "America",
    "barcelona": "Spain",
    "baton rouge, la": "America",
    "bay area, ca.": "America",
    "birmingham, al": "America",
    "boston": "America",
    "boston college": "America",
    "brantford": "Canada",
    "brooklyn, ny, us": "America",
    "buffalo": "America",
    "bushwood": "America",
    "california": "America",
    "canada": "Canada",
    "carlsbad | ca": "America",
    "central mass": "America",
    "charleston, sc": "America",
    "cheltenham": "UK",
    "chicago area": "America",
    "chicagoland": "America",
    "cincinnati, ohio": "America",
    "colombia": "Colombia",
    "colorado": "America",
    "columbus": "America",
    "conway, ar": "America",
    "cranberry 16066/bonita springs": "America",
    "dallas tx": "America",
    "dallas, tx": "America",
    "dallas,texas": "America",
    "dc": "America",
    "denver co": "America",
    "denver, co": "America",
    "detroit, michigan": "America",
    "dorado": "America",
    "douglas, ma": "America",
    "dublin, ireland": "Ireland",
    "east coast, us": "America",
    "eau claire": "America",
    "evanston illinois": "America",
    "florida": "America",
    "fort lee, nj": "America",
    "foster city, ca": "America",
    "ft collins": "America",
    "ft lauderdale": "America",
    "fullerton, ca": "America",
    "georgia": "America",
    "grandville, michigan": "America",
    "great lakes": "America",
    "greater geelong": "Australia",
    "greensboro nc": "America",
    "hanover, maryland": "America",
    "happy valley, oregon": "America",
    "hershey, pa": "America",
    "home: iad, college: jfk": "America",
    "hoover, alabama": "America",
    "hopatcong, nj": "America",
    "houston tx": "America",
    "htown": "America",
    "iowa state university": "America",
    "island of oahu, hawaii": "America",
    "jamestown virginia": "America",
    "jersey city": "America",
    "jetblue t5 at jfk": "America",
    "kalispell montana": "America",
    "kansas city, missouri": "America",
    "kc": "America",
    "kcmo": "America",
    "kentuckinmyshirt": "America",
    "key west to bar harbor": "America",
    "kingwood": "America",
    "kokomo, in": "America",
    "la": "America",
    "la jolla, california": "America",
    "lantana, tx usa": "America",
    "lexington ky": "America",
    "london": "UK",
    "long beach": "America",
    "long beach, ny": "America",
    "long island": "America",
    "los angeles by way of philly": "America",
    "los angeles, new orleans!": "America",
    "los gatos, ca": "America",
    "louisville, ky.": "America",
    "ma": "America",
    "mabel, mn": "America",
    "mammoth lakes": "America",
    "manchester,ct": "America",
    "manhattan.": "America",
    "marblehead, ma": "America",
    "massachusetts": "America",
    "memphis": "America",
    "merica": "America",
    "merrimack nh": "America",
    "miami beach, florida": "America",
    "miami, fl": "America",
    "miami, florida": "America",
    "middletown, ct": "America",
    "midlothian, virginia": "America",
    "midwest": "America",
    "midwest and sometimes spain": "America",
    "mill creek hs": "America",
    "milton, massachusetts": "America",
    "milwaukee, wi": "America",
    "mustang, oklahoma": "America",
    "naples, fl": "America",
    "nashville,tn": "America",
    "near los angeles ca": "America",
    "new canaan, ct": "America",
    "new england": "America",
    "new hampshire": "America",
    "new york": "America",
    "new york city": "America",
    "new york, new york": "America",
    "new yorker stranded in pa": "America",
    "north hollywood, ca": "America",
    "north plainfield, nj": "America",
    "north shore massachusetts": "America",
    "north tonawanda": "America",
    "nürnberg, germany": "Germany",
    "ny (globetrotter.exbonaerense)": "America",
    "ny ny": "America",
    "ny,ny": "America",
    "nyc": "America",
    "nyc // li": "America",
    "nyc | nola": "America",
    "nyc/austin": "America",
    "nyc/london": "America",
    "nyc✈️mia": "America",
    "ocean view, hawaii": "America",
    "ohio": "America",
    "ohio & kentucky": "America",
    "ohio,panama": "America",
    "old city philly": "America",
    "omaha": "America",
    "orchard park, ny": "America",
    "orlando": "America",
    "overland park, ks": "America",
    "pa": "America",
    "panamá": "Panama",
    "paramus, nj": "America",
    "park city": "America",
    "pensacola": "America",
    "perdido key, fl": "America",
    "pescadero, ca": "America",
    "philadelphia": "America",
    "philadelphia pa": "America",
    "philadelphia, usa": "America",
    "philly burbs": "America",
    "phl": "America",
    "pittsburgh": "America",
    "plain ol plano, tx": "America",
    "plano, tx": "America",
    "plymouth": "America",
    "portland, oregon": "America",
    "portsmouth, uk": "UK",
    "pr/miami/san francisco": "America",
    "puerto rico": "Puerto Rico",
    "queencity, usa": "America",
    "queens, ny": "America",
    "radford hs": "America",
    "renton, wa": "America",
    "rhode island": "America",
    "florida, usa": "America",
    "fort lauderdale": "America",
    "greenwich, ct": "America",
    "long island - arizona": "America",
    # Naples, FL and Boston, MA are both US cities (this was "Italy").
    "naples, fl, boston, ma": "America",
    "Los Angeles": "America",
    "Turks and caicos": "Turks and Caicos Islands",
    "UK, USA.": "UK",
    "Manhattan Beach, CA": "America",
    "Greater Los Angeles": "America",
    "Dallas, TX": "America",
    "San Francisco": "America",
    "CA": "America",
    "Argentina": "Argentina",
    "New York": "America",
    "Abuja": "Nigeria",
    "Las Piedras, Peru": "Peru",
    "Charlestown, MA": "America",
    "Albuquerque, NM": "America",
    "Boca Raton FL 33434": "America",
    "Anaheim, CA": "America",
    "Massachusetts": "America",
    "Bay Area": "America",
    "LES, NYC": "America",
    "Birmingham, Michigan": "America",
    "Libya": "Libya",
    "mckinney, tx": "America",
    "714 to 972": "America",
    "New York, sort of!": "America",
    "Staten Island, NY": "America",
    "Washington, D.C.": "America",
    "California Love #VFL": "America",
    "San Francisco, CA": "America",
    "Annapolis, Maryland": "America",
    "USA": "America",
    "Cork.Ireland": "Ireland",
    "SF Bay Area/ Las Vegas": "America",
    "LA&OC": "America",
    "Las Vegas, NV": "America",
    "usa": "America",
    "Portland, OR": "America",
    "Harrisburg": "America",
    "Tampa": "America",
    "Houston, TX": "America",
    "San Francisco Bay Area": "America",
    "Chicago, IL, USA": "America",
    "nyc to la": "America",
    "Miami, New York, Boston": "America",
    "NYC": "America",
    "Hoops City (Memphis, TN)": "America",
    "Manchester": "UK",
    "New Jersey": "America",
    "Larne": "UK",
    "London baby": "UK",
    "Madison, NJ": "America",
    "Brighton, UK": "UK",
    "Iowa": "America",
    "[Colorado]": "America",
    "Chicago, IL": "America",
    "Rocklin, CA": "America",
    "Westerville, Ohio": "America",
    "Cleveland, OH": "America",
    "DEN": "America",
    "Dallas": "America",
    "Ottawa": "Canada",
    "North Texas, USA": "America",
    "california": "America",
    "san diego": "America",
    "Killington, Vt": "America",
    "West Hollywood, CA": "America",
    "Buffalo/Oakland/Savannah/Ire": "America",
    "London UK & USA": "UK",
    "IL": "America",
    "Indiana": "America",
    "Washington DC": "America",
    "Mexico City": "Mexico",
    "Oakland, CA": "America",
    "Long Island, NY": "America",
    "Scotland": "UK",
    "Chicago": "America",
    "New Haven, CT": "America",
    "Cali,Colombia": "Colombia",
    "East Coast, US": "America",
    "Pittsburgh, PA": "America",
    "H-town": "America",
    "Arlington, VA": "America",
    "ÜT: 37.427592,-122.116357": "America",
    "Milwaukee, WI": "America",
    "Brussels": "Belgium",
    "Cambridge, MA": "America",
    "Sheboygan": "America",
    "Dartmouth, MA": "America",
    "Houston, Texas": "America",
    "Weston super Mare": "UK",
    "Boulder, Colorado": "America",
    "Hurst, TX": "America",
    "North West of England": "UK",
    "Raleigh, NC": "America",
    "texas": "America",
    "Toronto": "Canada",
    "Vancouver": "Canada",
    "sf": "America",
    "Libertyville, IL": "America",
    "Los Angeles & New York City": "America",
    "South Pasadena, CA": "America",
    "los angeles, ca": "America",
    "San Jose, CA": "America",
    "Newport Beach, CA": "America",
    "Cambridge, UK": "UK",
    "Vietnam": "Vietnam",
    "Glasgow": "UK",
    "Mountain View, CA": "America",
    "London": "UK",
    "Calgary": "Canada",
    "Marin County, CA": "America",
    "Detroit": "America",
    "L.A.": "America",
    "Italy": "Italy",
    "Cupertino, CA": "America",
    "San Diego": "America",
    "Birmingham, England": "UK",
    "Australia": "Australia",
    "Mumbai": "India",
    "Nairobi, Kenya": "Kenya",
    "Toronto, Canada": "Canada",
    "Somerville, MA": "America",
    "Melbourne, Australia": "Australia",
    "Walnut Creek, CA": "America",
    "Paris": "France",
    "Brooklyn, NY": "America",
    "Nashville, TN": "America",
    "San Mateo, CA": "America",
    "Philly": "America",
    "Floral Park, NY": "America",
    "Kuwait": "Kuwait",
    "Sacramento, CA": "America",
    "Vancouver, BC": "Canada",
    "Northern NJ": "America",
    "Chicago / LA / NYC": "America",
    "Beijing": "China",
    "Belmont, MA": "America",
    "Wellesley, MA": "America",
    "Madison, WI": "America",
    "Vienna, VA": "America",
    "Carrollton, TX": "America",
    "Memphis, TN": "America",
    "East Rutherford, NJ": "America",
    "New York, NY": "America",
    "North Carolina, USA": "America",
    "Boston, MA": "America",
    "Pennsylvania": "America",
    "Vienna, Virginia": "America",
    "Bellevue, WA": "America",
    "Greater Chicago Area": "America",
    "Santa Monica": "America",
    "Norfolk, VA": "America",
    "NY": "America",
    "Northern California": "America",
    "NC": "America",
    "Philadelphia, PA": "America",
    "Fort Worth, TX": "America",
    "Kirkland, WA": "America",
    "Topeka, KS": "America",
    "sunnyvale, CA": "America",
    "Berkeley, CA": "America",
    "Andover, MA": "America",
    "Livermore, CA": "America",
    "Brooklyn": "America",
    "Fort Lauderdale, Florida": "America",
    "Pasadena, CA": "America",
    "Milford, Michigan": "America",
    "Woodland Hills, CA": "America",
    "Clifton, VA": "America",
    "Henderson, NV": "America",
    "MN": "America",
    "Trenton, NJ": "America",
    "Jacksonville, FL": "America",
    "STL!!": "America",
    "Palm Beach, FL": "America",
    "Evanston, Illinois": "America",
    "Metro Detroit": "America",
    "Boston, MA (Cleveland)": "America",
    "CA, USA": "America",
    "Swampscott, MA": "America",
    "Ocean City, NJ": "America",
    "Oregon": "America",
    "Washington D.C.": "America",
    "Los Angeles, California": "America",
    "Sioux Falls, SD": "America",
    "Southern California": "America",
    "Weston, CT": "America",
    "West Point, GA": "America",
    "Hollywood, CA": "America",
    "Orange County, CA": "America",
    "Austin": "America",
    "Pittsburgh": "America",
    "Beijing, China": "China",
    "London, UK": "UK",
    "City of Industry, CA": "America",
    "San Antonio, Texas": "America",
    "Philly, PA": "America",
    "Salt Lake City, UT": "America",
    "Newark, DE": "America",
    "Ocean City, MD": "America",
    "Bozeman, MT": "America",
    "Upstate NY": "America",
    "My computer screen": "Unknown",
    "Monaco, Paris, Hong Kong": "Monaco",
    "Edina, MN": "America",
    "Waltham, MA": "America",
    "St. Paul, MN": "America",
    "southfield, michigan": "America",
    "Seattle, WA": "America",
    "Yuma, AZ": "America",
    "Gulf Shores, Alabama": "America",
    "Florida": "America",
    "ÜT: 32.957923,-117.202476": "America",
    "Southern Maryland": "America",
    "Osaka, Japan": "Japan",
    "New Orleans, Louisiana": "America",
    "Leominster, MA": "America",
    "Santa Cruz, CA": "America",
    "Providence, RI": "America",
    "Saugus, MA": "America",
    "Huntington Beach, CA": "America",
    "Little Rock, AR": "America",
    "nyc": "America",
    "kansas city": "America",
    "Colorado Springs": "America",
    "Santa Barbara, CA": "America",
    "Venice Beach": "America",
    "Irvine": "America",
    "SoCal": "America",
    "Dallas/Fort Worth": "America",
    "US": "America",
    "Santa Clara, CA": "America",
    "Montreal, Quebec": "Canada",
    "Hamilton, Ontario, Canada": "Canada",
    "Phoenix, Arizona": "America",
    "Antioch, CA": "America",
    "Eugene, Oregon": "America",
    "ÜT: 33.944638,-118.402832": "America",
    "CT": "America",
    "Indianapolis": "America",
    "Malibu, CA": "America",
    "Highlands, NJ": "America",
    "dc/ny": "America",
    "Massachusetts": "America",
    "Belleville, MI": "America",
    "Boulder, CO": "America",
    "Canyon Country, California": "America",
    "Amsterdam": "Netherlands",
    "New Orleans": "America",
    "California, United States": "America",
    "Grand Blanc": "America",
    "Central Illinois": "America",
    "Santa Monica, CA": "America",
    "Portland, OR": "America",
    "Cambridge": "UK",
    "North Dakota": "America",
    "san francisco, ca": "America",
    "nein, london, or maui.": "UK",
    "east coast, us": "America",
    "washington, dc": "America",
    "vancouver, ca": "Canada",
    "sweden": "Sweden",
    "belfast/boston": "UK",
    "ocean, nj": "America",
    "fresno, ca": "America",
    "richmond, va": "America",
    "atlanta, ga & st augustine, fl": "America",
    "springfield, mo": "America",
    "new jersey, usa": "America",
    "cincinnati": "America",
    "hilton head, sc": "America",
    "elmira, ny": "America",
    "austin, texas": "America",
    "grand junction, colorado": "America",
    "clifton, nj": "America",
    "denver": "America",
    "purcellville, va": "America",
    "charleston, sc": "America",
    "mammoth lakes": "America",
    "louisville, ky": "America",
    "manassas va": "America",
    "kalamazoo & chicago": "America",
    "lehigh valley, pa": "America",
    "seattle": "America",
    "warsaw, berlin, kiev": "Poland",
    "london via adelaide": "UK",
    "socal is where my mind stays": "America",
    "dc/sf/bflo": "America",
    "raleigh": "America",
    "ottawa/st.louis": "Canada",
    "columbus, ohio": "America",
    "htx": "America",
    "irvine, ca": "America",
    "detroit, michigan": "America",
    "america's dairyland": "America",
    "san diego, ca": "America",
    "brazil": "Brazil",
    "almere, the netherlands": "Netherlands",
    "walnut creek, ca when i'm ther": "America",
    "france": "France",
    "germany": "Germany",
    "oklahoma": "America",
    "colorado": "America",
    "san francisco, ca": "America",
    "st. louis mo": "America",
    "danville ca": "America",
    "medford, ma": "America",
    "ireland": "Ireland",
    "toronto canada": "Canada",
    "buffalo, ny": "America",
    "pittsburgh": "America",
    "corpus christi": "America",
    "erie, pa": "America",
    "michigan": "America",
    "stavanger, norway": "Norway",
    "southern california and hawaii": "America",
    "quito, ecuador": "Ecuador",
    "orlando, fl": "America",
    "central nj": "America",
    "irving texas": "America",
    "alexandria, va": "America",
    "edinburgh": "UK",
    "oxford, ms": "America",
    "grimsby - uk": "UK",
    "virginia, usa": "America",
    "pdx": "America",
    "metro dc area": "America",
    "kingston, ontario": "Canada",
    "wdve pittsburgh": "America",
    "raleigh, north carolina, usa": "America",
    "guatemala": "Guatemala",
    "east coast": "America",
    "new york city": "America",
    "washington, dc.": "America",
    "boston": "America",
    "a californian in london": "UK",
    "south australia": "Australia",
    "austin, tx": "America",
    "gig harbor": "America",
    "ontario canada": "Canada",
    "yyc": "Canada",
    "cloud city, ma": "America",
    "london-manila": "UK",
    "south florida": "America",
    "virginia, usa": "America",
    "central nj": "America",
    "united states": "America",
    "neenah, wi": "America",
    "phila, pa": "America",
    "columbus oh": "America",
    "columbus, ohio": "America",
    "farmington, utah": "America",
    "singapore": "Singapore",
    "omaha, ne": "America",
    "north bend, wa": "America",
    "iowa state university": "America",
    "india ✈️ chicago ✈️ d.c. ✈️ fl": "India",
    "dallas, tx.": "America",
    "beaverton, or": "America",
    "university city, mo": "America",
    "johnson city tn": "America",
    "orlando florida. (winter park)": "America",
    "las vegas": "America",
    "mckinney, texas": "America",
    "west coast": "America",
    "sutherlin, oregon": "America",
    "la jolla, california": "America",
    "fort worth, texas": "America",
    "minnesota": "America",
    "canton, ma": "America",
    "alabama": "America",
    "detroit, michigan": "America",
    "phoenix, az": "America",
    "bay area - cali": "America",
    "maryland": "America",
    "miami": "America",
    "tri cities (tri)": "America",
    "most states in us": "America",
    "college station, tx": "America",
    "dallas fort worth": "America",
    "savannah, ga": "America",
    "saratoga springs": "America",
    "triad": "America",
    "hanover twp, pa": "America",
    "millville,nj": "America",
    "charlotte, nc": "America",
    "crofton, maryland": "America",
    "stafford va": "America",
    "washington,d.c.": "America",
    "dallas, tx": "America",
    "philadephia, pa": "America",
    "mclean, va": "America",
    "va": "America",
    "baltimore, md": "America",
    "aldie va": "America",
    "nyc // li": "America",
    "cincinnati, oh": "America",
    "carlsbad, ca": "America",
    "des moines, ia": "America",
    "terrace park oh": "America",
    "southeastern pennsylvania usa": "America",
    "north carolina": "America",
    "edmonton": "Canada",
    "wayne,pa usa": "America",
    "windermere, florida": "America",
    "wchob, buffalo, ny": "America",
    "madbury, nh": "America",
    "orange, ca": "America",
    "leesburg, va": "America",
    "livonia, mi": "America",
    "windermere (seattle)": "America",
    "wexford, pa": "America",
    "sequim, wa": "America",
    "nürnberg, germany": "Germany",
    "nashville via minnesota": "America",
    "russia": "Russia",
    "knoxville, tn": "America",
    "neenah, wi": "America",
    "mckinney tx": "America",
    "orlando": "America",
    "philadelphia usa": "America",
    "south carolina": "America",
    "asheville, nc": "America",
    "london": "UK",
    "portland, maine": "America",
    "queens, new york": "America",
    "san jose , ca": "America",
    "lawrence, ma": "America",
    "lowell, ma": "America",
    "detroit, mi": "America",
    "okinawa, japan": "Japan",
    "milwaukee, wi": "America",
    "jupiter, fl": "America",
    "virginia beach": "America",
    "mission, kansas": "America",
    "maine": "America",
    "brighton": "UK",
    "liverpool": "UK",
    "san antonio, republic of texas": "America",
    "miniapple(s)": "America",
    "plano, texas": "America",
    "euless, texas": "America",
    "lake arrowhead": "America",
    "largo florida": "America",
    "greater boston area": "America",
    "northern ireland": "UK",
    "waynesville, ohio": "America",
    "new delhi": "India",
    "north hollywood": "America",
    "greenbow, alabama": "America",
    "college station": "America",
    "arlington va": "America",
    "mexico df": "Mexico",
    "seattle, wa, usa": "America",
    "lake county, illinois": "America",
    "charlotte,nc": "America",
    "winterville nc": "America",
    "dallas, or sometimes detroit": "America",
    "tampa, florida": "America",
    "brooklyn to across the globe": "America",
    "washington, d.c": "America",
    "dublin, ireland": "Ireland",
    "san marcos,ca": "America",
    "chapel hill, nc": "America",
    "austin, tx.": "America",
    "greater geelong": "Australia",
    "hampton roads": "America",
    "jacksonville florida": "America",
    "montgomery al": "America",
    "salt lake city, usa": "America",
    "omaha": "America",
    "windermere (seattle)": "America",
    "midlothian, tx": "America",
    "santo domingo": "Dominican Republic",
    "waco, texas": "America",
    "new orleans, la": "America",
    "cape cod": "America",
    "san antonio, tx": "America",
    "el paso, tx": "America",
    "ann arbor, mi": "America",
    "saint paul": "America",
    "knoxville, tn": "America",
    "dallas, texas": "America",
    "natchitoches, la": "America",
    "glendale, arizona": "America",
    "atx": "America",
    "st paul, minnesota": "America",
    "sarasota, fl": "America",
    "bentonville, arkansas": "America",
    "indianapolis, in": "America",
    "brooklyn by way of chicago": "America",
    "wichita falls, texas": "America",
    "illinos": "America",
    "lafayette, la": "America",
    "dallas, texas": "America",
    "sloop": "Unknown",
    "lost boys, neverland": "Unknown",
    "ig; tannersayre": "Unknown",
    "here. but i want to be there.": "Unknown",
    "the greatest city in the world": "Unknown",
    "hertz's couch": "Unknown",
    "somewhere east": "Unknown",
    "trying to go everywhere!": "Unknown",
    "970 colorado": "America",
    "in the kitchen": "Unknown",
    "webster groves, mo": "America",
    "pilot point, republic of texas": "America",
    "chelmsford, ma": "America",
    "nigeria,lagos": "Nigeria"
}

# Lower-case every key so the table can be matched against a lower-cased
# location column. Keys that differ only by case collapse into one entry;
# whitespace inside or around a key is left untouched.
tweet_location_dic = {
    key.lower(): value for key, value in tweet_location_dic.items()
}

### Data source

In [54]:
# Load the raw tweets; the path is relative to the notebook's working directory.
df = pd.read_csv(filepath_or_buffer='Tweets.csv')

### Location normalization

In [55]:
# Country derived from the free-text tweet location. The text is trimmed and
# lower-cased before the lookup so that values differing from a dictionary key
# only by case or surrounding whitespace still match.
location_from_tweet = (
    df['tweet_location']
    .str.strip()
    .str.lower()
    .map(tweet_location_dic)
)

# Country derived from the user's timezone (exact-match lookup).
location_from_timezone = df['user_timezone'].map(user_timezone_dic)

# The timezone-based value takes precedence; the tweet-location value is only
# used for rows where the timezone lookup produced no result. Rows matched by
# neither lookup stay missing (NaN).
# NOTE: this overwrites the raw `tweet_location` text with the normalized
# label, so re-running this cell without re-loading `df` will feed already
# normalized labels back into the lookup.
df['tweet_location'] = location_from_timezone.fillna(location_from_tweet)

### Output

In [56]:
# Persist the cleaned frame for the visualization step; the row index is not written.
df.to_csv(path_or_buf='output_tweets.csv', index=False)