In [1]:
import pandas as pd
import numpy as np
import warnings

import seaborn as sns
import matplotlib.pyplot as plt

#Plotly Libraris
import plotly.express as px
import plotly.graph_objects as go
import plotly.figure_factory as ff
from plotly.colors import n_colors
from plotly.subplots import make_subplots
import plotly.io as pio



warnings.filterwarnings('ignore')

pio.templates.default = "ggplot2"

#dataframe display settings
pd.set_option('display.max_columns', 5000000)
pd.set_option('display.max_rows', 50000000)

In [2]:
## Data from dataset 3
industry_trends = pd.read_csv('data/dataset3.csv')
industry_trends.rename(columns={"Unnamed: 0": "StartupID", "Unnamed: 6": "City_ZIP"}, inplace=True)
## Data from dataset 4
startup_info = pd.read_csv('data/dataset4.csv')


In [3]:
startup_info['founded_year'] = pd.to_datetime(startup_info['founded_at'], errors = 'coerce').dt.year
startup_info['funding_total_usd'].replace('-', 0, inplace=True)
startup_info['funding_total_usd'] = startup_info['funding_total_usd'].astype(float)
startup_info = startup_info.drop_duplicates()

# Cleanning dataset
clean_startup_info = startup_info.drop(['permalink', 'homepage_url'], axis=1)

# Remove the NaN name
clean_startup_info.dropna(how='any', subset=['name'], axis=0, inplace=True)

#Extracting year value from "first_funding_at" and changing to int
clean_startup_info['first_funding_at'] = clean_startup_info.first_funding_at.str.split("-").str[0]
clean_startup_info['first_funding_at'] = clean_startup_info['first_funding_at'].astype(float)
#Extracting year value from "last_funding_at" and changing to int
clean_startup_info['last_funding_at'] = clean_startup_info.last_funding_at.str.split("-").str[0]
clean_startup_info['last_funding_at'] = clean_startup_info['last_funding_at'].astype(float)

# Treat Nan category
clean_startup_info['category_list'] = clean_startup_info['category_list'].replace(np.nan, 'other')
clean_startup_info.head()

Unnamed: 0,name,category_list,funding_total_usd,status,country_code,state_code,region,city,funding_rounds,founded_at,first_funding_at,last_funding_at,founded_year
0,#fame,Media,10000000.0,operating,IND,16,Mumbai,Mumbai,1,,2015.0,2015.0,
1,:Qounter,Application Platforms|Real Time|Social Network...,700000.0,operating,USA,DE,DE - Other,Delaware City,2,2014-09-04,2014.0,2014.0,2014.0
2,"(THE) ONE of THEM,Inc.",Apps|Games|Mobile,3406878.0,operating,,,,,1,,2014.0,2014.0,
3,0-6.com,Curated Web,2000000.0,operating,CHN,22,Beijing,Beijing,1,2007-01-01,2008.0,2008.0,2007.0
4,004 Technologies,Software,0.0,operating,USA,IL,"Springfield, Illinois",Champaign,1,2010-01-01,2014.0,2014.0,2010.0


In [4]:
corr_startups = clean_startup_info[clean_startup_info['status'] != 'ipo']
corr_startups.reset_index(drop=True, inplace=True)
corr_startups['is_successful'] = corr_startups['status'].apply(lambda x: 1 if x in ['operating', 'acquired'] else 0)

corr_startups.columns


Index(['name', 'category_list', 'funding_total_usd', 'status', 'country_code',
       'state_code', 'region', 'city', 'funding_rounds', 'founded_at',
       'first_funding_at', 'last_funding_at', 'founded_year', 'is_successful'],
      dtype='object')

In [5]:
# Split the 'category_list' column by '|' and create dummy variables
categories_dummy = corr_startups['category_list'].str.get_dummies(sep='|')


In [6]:
# One-hot encode 'country_code' and 'city' columns
country_dummy = pd.get_dummies(corr_startups['country_code'], prefix='country')

# Concatenate the dummy variables with the DataFrame
encoded_corr = pd.concat([corr_startups, categories_dummy, country_dummy], axis=1)
encoded_corr.head(3)


Unnamed: 0,name,category_list,funding_total_usd,status,country_code,state_code,region,city,funding_rounds,founded_at,first_funding_at,last_funding_at,founded_year,is_successful,3D,3D Printing,3D Technology,Accounting,Active Lifestyle,Ad Targeting,Adaptive Equipment,Advanced Materials,Adventure Travel,Advertising,Advertising Exchanges,Advertising Networks,Advertising Platforms,Advice,Aerospace,Agriculture,Air Pollution Control,Algorithms,All Markets,All Students,Alternative Medicine,Alumni,Analytics,Android,Angels,Animal Feed,Anything Capital Intensive,App Discovery,App Marketing,App Stores,Application Performance Monitoring,Application Platforms,Apps,Aquaculture,Architecture,Archiving,Art,Artificial Intelligence,Artists Globally,Assisitive Technology,Assisted Living,Auctions,Audio,Audiobooks,Augmented Reality,Auto,Automated Kiosk,Automotive,B2B,B2B Express Delivery,BPO Services,Babies,Baby Accessories,Baby Boomers,Baby Safety,Banking,Batteries,Beauty,Bicycles,Big Data,Big Data Analytics,Billing,Bio-Pharm,Biofuels,Bioinformatics,Biomass Power Generation,Biometrics,Biotechnology,Biotechnology and Semiconductor,Bitcoin,Blogging Platforms,Boating Industry,Brand Marketing,Brewing,Bridging Online and Offline,Broadcasting,Brokers,Browser Extensions,Building Owners,Building Products,Business Analytics,Business Development,Business Information Systems,Business Intelligence,Business Productivity,Business Services,Business Travelers,CAD,CRM,Cable,Call Center Automation,Cannabis,Carbon,Career Management,Career Planning,Cars,Casual Games,Cause Marketing,Celebrity,Certification Test,Charities,Charity,Charter Schools,Chat,Chemicals,Child Care,China Internet,Civil Engineers,Classifieds,Clean Energy,Clean Technology,Clean Technology IT,Clinical Trials,Cloud Computing,Cloud Data Services,Cloud Gaming,Cloud Infrastructure,Cloud Management,Cloud Security,Cloud-Based Music,Coffee,Collaboration,Collaborative Consumption,Collectibles,College Campuses,College Recruiting,Colleges,Comics,Commercial Real Estate,Commercial Solar,Commodities,Communications Hardware,Communications Infrastructure,Communities,Comparison Shopping,Computer Vision,Computers,Concentrated Solar Power,Concerts,Console Gaming,Construction,Consulting,Consumer Behavior,Consumer Electronics,Consumer Goods,Consumer Internet,Consumer Lending,Consumers,Contact Centers,Contact Management,Content,Content Creators,Content Delivery,Content Discovery,Content Syndication,Contests,Cooking,Corporate IT,Corporate Training,Corporate Wellness,Cosmetic Surgery,Cosmetics,Coupons,Coworking,Craft Beer,Creative,Creative Industries,Credit,Credit Cards,Crowdfunding,Crowdsourcing,Cryptocurrency,Curated Web,Custom Retail,Customer Service,Customer Support Tools,Cyber,Cyber Security,DIY,DOD/Military,Darknet,Data Center Automation,Data Center Infrastructure,Data Centers,Data Integration,Data Mining,Data Privacy,Data Security,Data Visualization,Databases,Debt Collecting,Deep Information Technology,Defense,Delivery,Demographies,Dental,Design,Designers,Developer APIs,Developer Tools,Development Platforms,Diabetes,Diagnostics,Dietary Supplements,Digital Entertainment,Digital Media,Digital Rights Management,Digital Signage,Direct Advertising,Direct Marketing,Direct Sales,Discounts,Displays,Disruptive Models,Distribution,Distributors,Diving,Doctors,Document Management,Domains,Drones,E-Books,E-Commerce,E-Commerce Platforms,EBooks,EDA Tools,Early Stage IT,Early-Stage Technology,East Africa,EdTech,Ediscovery,Education,Educational Games,Edutainment,Elder Care,Elderly,Electric Vehicles,Electrical Distribution,Electronic Health Records,Electronics,Email,Email Marketing,Email Newsletters,Embedded Hardware and Software,Emerging Markets,Employer Benefits Programs,Employment,Energy,Energy Efficiency,Energy IT,Energy Management,Energy Storage,Engineering Firms,English-Speaking,Enterprise 2.0,Enterprise Application,Enterprise Hardware,Enterprise Purchasing,Enterprise Resource Planning,Enterprise Search,Enterprise Security,Enterprise Software,Enterprises,Entertainment,Entertainment Industry,Entrepreneur,Environmental Innovation,Estimation and Quoting,Event Management,Events,Exercise,Experience Design,Eyewear,FPGA,Face Recognition,Facebook Applications,Families,Fantasy Sports,Farmers Market,Farming,Fashion,Fertility,Field Support Services,File Sharing,Film,Film Distribution,Film Production,FinTech,Finance,Finance Technology,Financial Exchanges,Financial Services,First Aid,Fitness,Flash Sales,Flash Storage,Fleet Management,Flowers,Fmcg,Food Processing,Forums,Franchises,Fraud Detection,Freelancers,Freemium,FreetoPlay Gaming,Fruit,Fuel Cells,Fuels,Funeral Industry,Furniture,Gadget,Gambling,Game,Game Mechanics,Games,Gamification,Gas,Gay & Lesbian,General Public Worldwide,Generation Y-Z,Genetic Testing,Geospatial,Gift Card,Gift Exchange,Gift Registries,Gold,Golf Equipment,Google Apps,Google Glass,Governance,Government Innovation,Governments,Gps,Graphic Design,Graphics,Green,Green Building,Green Consumer Goods,GreenTech,Groceries,Group Buying,Group Email,Group SMS,Guide to Nightlife,Guides,HDTV,Handmade,Hardware,Hardware + Software,Health Care,Health Care Information Technology,Health Diagnostics,Health Services Industry,Health and Insurance,Health and Wellness,Healthcare Services,Heavy Industry,Hedge Funds,Hi Tech,High School Students,High Schools,High Tech,Hip Hop,Home & Garden,Home Automation,Home Decor,Home Owners,Home Renovation,Homeland Security,Homeless Shelter,Hospitality,Hospitals,Hotels,Human Computer Interaction,Human Resource Automation,Human Resources,Humanitarian,Hunting Industry,ICT,IT Management,IT and Cybersecurity,IaaS,Identity,Identity Management,Image Recognition,Impact Investing,In-Flight Entertainment,Incentives,Incubators,Independent Music,Independent Music Labels,Independent Pharmacies,Indians,Indoor Positioning,Industrial,Industrial Automation,Industrial Energy Efficiency,Information Security,Information Services,Information Technology,Infrastructure,Infrastructure Builders,Innovation Engineering,Innovation Management,Insurance,Insurance Companies,Intellectual Asset Management,Intellectual Property,Intelligent Systems,Interest Graph,Interface Design,Interior Design,Internet,Internet Infrastructure,Internet Marketing,Internet Radio Market,Internet Service Providers,Internet TV,Internet Technology,Internet of Things,Invention,Investment Management,Jewelry,Journalism,K-12 Education,Kids,Kinect,Knowledge Management,Labor Optimization,Landscaping,Language Learning,Lasers,Law Enforcement,Lead Generation,Lead Management,Legal,Leisure,Licensing,Life Sciences,Lifestyle,Lifestyle Businesses,Lifestyle Products,Lighting,Limousines,Lingerie,Linux,Local,Local Advertising,Local Based Services,Local Businesses,Local Commerce,Local Coupons,Local Search,Local Services,Location Based Services,Logistics,Logistics Company,Lotteries,Low Bid Auctions,Loyalty Programs,M2M,MMO Games,Mac,Machine Learning,Made in Italy,Manufacturing,Maps,Market Research,Marketing Automation,Marketplaces,Mass Customization,Match-Making,Material Science,Mechanical Solutions,Media,Medical,Medical Devices,Medical Professionals,Medication Adherence,Meeting Software,Mens Specific,Messaging,Micro-Enterprises,MicroBlogging,Minerals,Mining Technologies,Mobile,Mobile Advertising,Mobile Analytics,Mobile Commerce,Mobile Coupons,Mobile Devices,Mobile Emergency&Health,Mobile Enterprise,Mobile Games,Mobile Health,Mobile Infrastructure,Mobile Payments,Mobile Search,Mobile Security,Mobile Shopping,Mobile Social,Mobile Software Tools,Mobile Video,Mobility,Monetization,Moneymaking,Mothers,Motion Capture,Motors,Multi-level Marketing,Music,Music Education,Music Services,Music Venues,Musical Instruments,Musicians,NFC,Nanotechnology,Natural Gas Uses,Natural Language Processing,Natural Resources,Navigation,Network Security,Networking,Neuroscience,New Product Development,New Technologies,News,Niche Specific,Nightclubs,Nightlife,Non Profit,Non-Tech,Nonprofits,Notebooks,Nutraceutical,Nutrition,Office Space,Offline Businesses,Oil,Oil & Gas,Oil and Gas,Online Auctions,Online Dating,Online Education,Online Gaming,Online Identity,Online Rental,Online Reservations,Online Scheduling,Online Shopping,Online Travel,Online Video Advertising,Open Source,Operating Systems,Opinions,Optical Communications,Optimization,Organic,Organic Food,Outdoor Advertising,Outdoors,Outsourcing,P2P Money Transfer,PC Gaming,PaaS,Parenting,Parking,Payments,Peer-to-Peer,Performance Marketing,Performing Arts,Personal Branding,Personal Data,Personal Finance,Personal Health,Personalization,Pervasive Computing,Pets,Pharmaceuticals,Photo Editing,Photo Sharing,Photography,Physical Security,Physicians,Plumbers,Podcast,Point of Sale,Politics,Polling,Portals,Postal and Courier Services,Pre Seed,Prediction Markets,Predictive Analytics,Presentations,Price Comparison,Printing,Privacy,Private Corrections,Private School,Private Social Networking,Procurement,Product Design,Product Development Services,Product Search,Productivity,Productivity Software,Professional Networking,Professional Services,Project Management,Promotional,Property Management,Proximity Internet,Psychology,Public Relations,Public Safety,Public Transportation,Publishing,Q&A,QR Codes,Quantified Self,Quantitative Marketing,RFID,RIM,Racing,Radical Breakthrough Startups,Rapidly Expanding,Reading Apps,Real Estate,Real Estate Investors,Real Time,Realtors,Recipes,Recreation,Recruiting,Recycling,Registrars,Rehabilitation,Religion,Remediation,Renewable Energies,Renewable Tech,Rental Housing,Reputation,Residential Solar,Resorts,Restaurants,Retail,Retail Technology,Retirement,Reviews and Recommendations,Ride Sharing,Risk Management,Robotics,Rural Energy,SEO,SMS,SNS,SaaS,Sailing Community,Sales Automation,Sales and Marketing,Salesforce Killers,Search,Search Marketing,Security,Self Development,Self Storage,Semantic Search,Semantic Web,Semiconductor Manufacturing Equipment,Semiconductors,Senior Citizens,Senior Health,Sensors,Serious Games,Service Industries,Service Providers,Services,Sex Industry,SexTech,Shared Services,Shipping,Shipping Broker Industry,Shoes,Shopping,Simulation,Skate Wear,Skill Assessment,Skill Gaming,Small and Medium Businesses,Smart Building,Smart Grid,Soccer,Social + Mobile + Local,Social Activists,Social Bookmarking,Social Business,Social Buying,Social CRM,Social Commerce,Social Entrepreneurship,Social Fundraising,Social Games,Social Innovation,Social Investing,Social Media,Social Media Advertising,Social Media Agent,Social Media Management,Social Media Marketing,Social Media Monitoring,Social Media Platforms,Social Network Media,Social News,Social Opinion Platform,Social Recruiting,Social Search,Social Television,Social Travel,Software,Software Compliance,Solar,South East Asia,Space Travel,Spam Filtering,Spas,Specialty Chemicals,Specialty Foods,Specialty Retail,Speech Recognition,Sponsorship,Sporting Goods,Sports,Sports Stadiums,Staffing Firms,Startup Histrionics,Startups,Stock Exchanges,Storage,Subscription Businesses,Subscription Service,Sunglasses,Supply Chain Management,Surfing Community,Surveys,Sustainability,Swimming,Synchronization,Systems,TV Production,TV Station,Tablets,Task Management,Taxis,Tea,Teachers,Teaching STEM Concepts,Tech Field Support,Technical Continuing Education,Technology,Teenagers,Telecommunications,Telephony,Television,Temporary Staffing,Test and Measurement,Testing,Text Analytics,Textbooks,Textiles,Theatre,Therapeutics,Ticketing,Timeshares,Tourism,Toys,Tracking,Trading,Training,Transaction Processing,Translation,Transportation,Travel,Travel & Tourism,Trusted Networks,Tutoring,Twin-Tip Skis,Twitter Applications,UV LEDs,Underserved Children,Unifed Communications,Universities,University Students,Unmanned Air Systems,Usability,User Experience Design,User Interface,User Testing,Utilities,Utility Land Vehicles,Vacation Rentals,Vending and Concessions,Venture Capital,Ventures for Good,Vertical Search,Veterinary,Video,Video Chat,Video Conferencing,Video Editing,Video Game Tournaments,Video Games,Video Processing,Video Streaming,Video on Demand,Virtual Currency,Virtual Desktop,Virtual Goods,Virtual Workforces,Virtual Worlds,Virtualization,Visual Search,Visualization,VoIP,Vulnerability Management,Waste Management,Watch,Water,Water Purification,Wealth Management,Wearables,Web Browsers,Web CMS,Web Design,Web Development,Web Hosting,Web Presence Management,Web Tools,WebOS,Weddings,West Africa,Wholesale,Wind,Windows Phone 7,Wine And Spirits,Wireless,Women,Writers,Young Adults,iOS,iPad,iPhone,iPod Touch,mHealth,other,country_ALB,country_ARE,country_ARG,country_ARM,country_AUS,country_AUT,country_AZE,country_BAH,country_BEL,country_BGD,country_BGR,country_BHR,country_BLM,country_BLR,country_BLZ,country_BMU,country_BRA,country_BRB,country_BRN,country_BWA,country_CAN,country_CHE,country_CHL,country_CHN,country_CIV,country_CMR,country_COL,country_CRI,country_CYM,country_CYP,country_CZE,country_DEU,country_DMA,country_DNK,country_DOM,country_DZA,country_ECU,country_EGY,country_ESP,country_EST,country_FIN,country_FRA,country_GBR,country_GEO,country_GGY,country_GHA,country_GIB,country_GRC,country_GRD,country_GTM,country_HKG,country_HND,country_HRV,country_HUN,country_IDN,country_IND,country_IRL,country_IRN,country_ISL,country_ISR,country_ITA,country_JAM,country_JEY,country_JOR,country_JPN,country_KAZ,country_KEN,country_KHM,country_KNA,country_KOR,country_KWT,country_LAO,country_LBN,country_LIE,country_LKA,country_LTU,country_LUX,country_LVA,country_MAF,country_MAR,country_MCO,country_MDA,country_MEX,country_MKD,country_MLT,country_MMR,country_MNE,country_MOZ,country_MUS,country_MYS,country_NGA,country_NIC,country_NLD,country_NOR,country_NPL,country_NZL,country_OMN,country_PAK,country_PAN,country_PER,country_PHL,country_POL,country_PRI,country_PRT,country_PRY,country_PSE,country_QAT,country_ROM,country_RUS,country_RWA,country_SAU,country_SEN,country_SGP,country_SLV,country_SOM,country_SRB,country_SVK,country_SVN,country_SWE,country_SYC,country_TAN,country_TGO,country_THA,country_TTO,country_TUN,country_TUR,country_TWN,country_UGA,country_UKR,country_URY,country_USA,country_UZB,country_VEN,country_VNM,country_ZAF,country_ZMB,country_ZWE
0,#fame,Media,10000000.0,operating,IND,16,Mumbai,Mumbai,1,,2015.0,2015.0,,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1,:Qounter,Application Platforms|Real Time|Social Network...,700000.0,operating,USA,DE,DE - Other,Delaware City,2,2014-09-04,2014.0,2014.0,2014.0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0
2,"(THE) ONE of THEM,Inc.",Apps|Games|Mobile,3406878.0,operating,,,,,1,,2014.0,2014.0,,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [2]:
# Calculate the correlation matrix
correlation_matrix = encoded_corr.corr()

# Plot the correlation matrix
plt.figure(figsize=(12, 10))
sns.heatmap(correlation_matrix[['is_successful']].sort_values(by='is_successful', ascending=False),
            annot=True, cmap='coolwarm', fmt=".2f", annot_kws={"size": 10})
plt.title('Correlation with is_successful')
plt.show()


NameError: name 'encoded_corr' is not defined

In [1]:
correlation_matrix[['is_successful']].sort_values(by='is_successful', ascending=False)

NameError: name 'correlation_matrix' is not defined