# The Indian Start-up Ecosystem

### Installations

In [1281]:
# %pip install seaborn
# %pip install plotly --upgrade

### Imports

In [1282]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from scipy import stats

import plotly.express as px

### Load Data

In [1283]:
# Load the yearly start-up funding CSVs (2018-2021), one DataFrame per year.
# The paths are relative, so they resolve against the notebook's working directory.
data_2018 =  pd.read_csv('data/startup_funding2018.csv')
data_2019 =  pd.read_csv('data/startup_funding2019.csv')
data_2020 =  pd.read_csv('data/startup_funding2020.csv')
data_2021 =  pd.read_csv('data/startup_funding2021.csv')

In [1284]:
data_2018['Amount'].isna().sum()

0

### Exploratory Data Analysis

In [1285]:
data_2018.columns

Index(['Company Name', 'Industry', 'Round/Series', 'Amount', 'Location',
       'About Company'],
      dtype='object')

In [1286]:
# Map the 2018 column headers onto the names used by the 2019-2021 frames
# so that all four years share one schema.
column_aliases = {
    'Company Name': 'Company/Brand',
    'About Company': 'What it does',
    'Industry': 'Sector',
    'Round/Series': 'Stage',
    'Location': 'HeadQuarter',
    'Amount': 'Amount($)',
}
data_2018.rename(columns=column_aliases, inplace=True)

In [1287]:
data_2018.columns

Index(['Company/Brand', 'Sector', 'Stage', 'Amount($)', 'HeadQuarter',
       'What it does'],
      dtype='object')

In [1288]:
data_2018.head()

Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does
0,TheCollegeFever,"Brand Marketing, Event Promotion, Marketing, S...",Seed,250000,"Bangalore, Karnataka, India","TheCollegeFever is a hub for fun, fiesta and f..."
1,Happy Cow Dairy,"Agriculture, Farming",Seed,"₹40,000,000","Mumbai, Maharashtra, India",A startup which aggregates milk from dairy far...
2,MyLoanCare,"Credit, Financial Services, Lending, Marketplace",Series A,"₹65,000,000","Gurgaon, Haryana, India",Leading Online Loans Marketplace in India
3,PayMe India,"Financial Services, FinTech",Angel,2000000,"Noida, Uttar Pradesh, India",PayMe India is an innovative FinTech organizat...
4,Eunimart,"E-Commerce Platforms, Retail, SaaS",Seed,—,"Hyderabad, Andhra Pradesh, India",Eunimart is a one stop solution for merchants ...


In [1289]:
# The 2018 frame has no founder or investor columns; add them with a
# placeholder value so its columns match the later years.
for placeholder_column in ('Founders', 'Investor'):
    data_2018[placeholder_column] = 'Unknown'
data_2018

Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does,Founders,Investor
0,TheCollegeFever,"Brand Marketing, Event Promotion, Marketing, S...",Seed,250000,"Bangalore, Karnataka, India","TheCollegeFever is a hub for fun, fiesta and f...",Unknown,Unknown
1,Happy Cow Dairy,"Agriculture, Farming",Seed,"₹40,000,000","Mumbai, Maharashtra, India",A startup which aggregates milk from dairy far...,Unknown,Unknown
2,MyLoanCare,"Credit, Financial Services, Lending, Marketplace",Series A,"₹65,000,000","Gurgaon, Haryana, India",Leading Online Loans Marketplace in India,Unknown,Unknown
3,PayMe India,"Financial Services, FinTech",Angel,2000000,"Noida, Uttar Pradesh, India",PayMe India is an innovative FinTech organizat...,Unknown,Unknown
4,Eunimart,"E-Commerce Platforms, Retail, SaaS",Seed,—,"Hyderabad, Andhra Pradesh, India",Eunimart is a one stop solution for merchants ...,Unknown,Unknown
...,...,...,...,...,...,...,...,...
521,Udaan,"B2B, Business Development, Internet, Marketplace",Series C,225000000,"Bangalore, Karnataka, India","Udaan is a B2B trade platform, designed specif...",Unknown,Unknown
522,Happyeasygo Group,"Tourism, Travel",Series A,—,"Haryana, Haryana, India",HappyEasyGo is an online travel domain.,Unknown,Unknown
523,Mombay,"Food and Beverage, Food Delivery, Internet",Seed,7500,"Mumbai, Maharashtra, India",Mombay is a unique opportunity for housewives ...,Unknown,Unknown
524,Droni Tech,Information Technology,Seed,"₹35,000,000","Mumbai, Maharashtra, India",Droni Tech manufacture UAVs and develop softwa...,Unknown,Unknown


In [1290]:
data_2018.columns

Index(['Company/Brand', 'Sector', 'Stage', 'Amount($)', 'HeadQuarter',
       'What it does', 'Founders', 'Investor'],
      dtype='object')

In [1291]:
# 'Founded' is dropped from the 2019 frame so its columns match the other years.
# errors='ignore' keeps this cell re-runnable: without it, running the cell a
# second time on the same kernel raises KeyError because the column is already gone.
data_2019.drop(columns='Founded', inplace=True, errors='ignore')
data_2019.head()

Unnamed: 0,Company/Brand,HeadQuarter,Sector,What it does,Founders,Investor,Amount($),Stage
0,Bombay Shaving,,Ecommerce,Provides a range of male grooming products,Shantanu Deshpande,Sixth Sense Ventures,"$6,300,000",
1,Ruangguru,Mumbai,Edtech,A learning platform that provides topic-based ...,"Adamas Belva Syah Devara, Iman Usman.",General Atlantic,"$150,000,000",Series C
2,Eduisfun,Mumbai,Edtech,It aims to make learning fun via games.,Jatin Solanki,"Deepak Parekh, Amitabh Bachchan, Piyush Pandey","$28,000,000",Fresh funding
3,HomeLane,Chennai,Interior design,Provides interior designing solutions,"Srikanth Iyer, Rama Harinath","Evolvence India Fund (EIF), Pidilite Group, FJ...","$30,000,000",Series D
4,Nu Genes,Telangana,AgriTech,"It is a seed company engaged in production, pr...",Narayana Reddy Punyala,Innovation in Food and Agriculture (IFA),"$6,000,000",


In [1292]:
data_2019.columns

Index(['Company/Brand', 'HeadQuarter', 'Sector', 'What it does', 'Founders',
       'Investor', 'Amount($)', 'Stage'],
      dtype='object')

In [1293]:
# Drop 'Founded' and the stray 'Unnamed: 9' column from the 2020 frame.
# errors='ignore' keeps this cell re-runnable: without it, running the cell a
# second time on the same kernel raises KeyError because the columns are already gone.
data_2020.drop(columns=['Founded', 'Unnamed: 9'], inplace=True, errors='ignore')
data_2020.columns

Index(['Company/Brand', 'HeadQuarter', 'Sector', 'What it does', 'Founders',
       'Investor', 'Amount($)', 'Stage'],
      dtype='object')

In [1294]:
# 'Founded' is dropped from the 2021 frame so its columns match the other years.
# errors='ignore' keeps this cell re-runnable: without it, running the cell a
# second time on the same kernel raises KeyError because the column is already gone.
data_2021.drop(columns='Founded', inplace=True, errors='ignore')
data_2021.columns

Index(['Company/Brand', 'HeadQuarter', 'Sector', 'What it does', 'Founders',
       'Investor', 'Amount($)', 'Stage'],
      dtype='object')

In [1295]:
# Normalise the raw amount text (trim whitespace, remove thousands separators)
# and record which currency each figure was quoted in while the symbols are
# still present.
amount_text = data_2018['Amount($)'].str.strip().apply(str).str.replace(',', '', regex=False)
data_2018['Amount($)'] = amount_text

# Rupees: an explicit ₹ sign, or no $ sign and more than 8 characters.
has_rupee_sign = amount_text.str.contains('₹', regex=False)
has_dollar_sign = amount_text.str.contains('$', regex=False)
is_rupee = has_rupee_sign | (~has_dollar_sign & (amount_text.str.len() > 8))
data_2018['Original Currency'] = is_rupee.apply(lambda flag: 'Rupees' if flag else 'Dollars')
data_2018.head()


Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does,Founders,Investor,Original Currency
0,TheCollegeFever,"Brand Marketing, Event Promotion, Marketing, S...",Seed,250000,"Bangalore, Karnataka, India","TheCollegeFever is a hub for fun, fiesta and f...",Unknown,Unknown,Dollars
1,Happy Cow Dairy,"Agriculture, Farming",Seed,₹40000000,"Mumbai, Maharashtra, India",A startup which aggregates milk from dairy far...,Unknown,Unknown,Rupees
2,MyLoanCare,"Credit, Financial Services, Lending, Marketplace",Series A,₹65000000,"Gurgaon, Haryana, India",Leading Online Loans Marketplace in India,Unknown,Unknown,Rupees
3,PayMe India,"Financial Services, FinTech",Angel,2000000,"Noida, Uttar Pradesh, India",PayMe India is an innovative FinTech organizat...,Unknown,Unknown,Dollars
4,Eunimart,"E-Commerce Platforms, Retail, SaaS",Seed,—,"Hyderabad, Andhra Pradesh, India",Eunimart is a one stop solution for merchants ...,Unknown,Unknown,Dollars


#### Stripping all non-numeric characters (i.e. ₹, $) from the Amount column and converting it to float

In [1296]:
# Remove the currency symbols and turn the '—' placeholder into '0' so the
# column can be cast to float.
# NOTE(review): this makes undisclosed amounts indistinguishable from a real
# 0.0 — confirm that is intended before computing averages.
amount_digits = data_2018['Amount($)'].apply(str)
for symbol, substitute in (('₹', ''), ('—', '0'), ('$', "")):
    amount_digits = amount_digits.str.replace(symbol, substitute, regex=False)
data_2018['Amount($)'] = amount_digits.astype(float)
data_2018.head()

Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does,Founders,Investor,Original Currency
0,TheCollegeFever,"Brand Marketing, Event Promotion, Marketing, S...",Seed,250000.0,"Bangalore, Karnataka, India","TheCollegeFever is a hub for fun, fiesta and f...",Unknown,Unknown,Dollars
1,Happy Cow Dairy,"Agriculture, Farming",Seed,40000000.0,"Mumbai, Maharashtra, India",A startup which aggregates milk from dairy far...,Unknown,Unknown,Rupees
2,MyLoanCare,"Credit, Financial Services, Lending, Marketplace",Series A,65000000.0,"Gurgaon, Haryana, India",Leading Online Loans Marketplace in India,Unknown,Unknown,Rupees
3,PayMe India,"Financial Services, FinTech",Angel,2000000.0,"Noida, Uttar Pradesh, India",PayMe India is an innovative FinTech organizat...,Unknown,Unknown,Dollars
4,Eunimart,"E-Commerce Platforms, Retail, SaaS",Seed,0.0,"Hyderabad, Andhra Pradesh, India",Eunimart is a one stop solution for merchants ...,Unknown,Unknown,Dollars


#### Now let's convert the values in the Amount column that were tagged as Rupees to Dollars, then delete the 'Original Currency' column, since it will have served its purpose

#### Assumptions

1. If a value in the Amount column carries a currency symbol, it is in that currency
2. If a value has no symbol and is more than 8 characters long (after removing commas), it is treated as Rupees
3. The conversion rate used is the mid-year rate as of 30th June 2018

In [1297]:
# Multiply every amount tagged as Rupees by the exchange rate; amounts tagged
# as Dollars are left as they are.
exchange_rate = 0.0146
condition1 = (data_2018['Original Currency'] == 'Rupees')
data_2018.loc[condition1, 'Amount($)'] *= exchange_rate

data_2018

Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does,Founders,Investor,Original Currency
0,TheCollegeFever,"Brand Marketing, Event Promotion, Marketing, S...",Seed,250000.0,"Bangalore, Karnataka, India","TheCollegeFever is a hub for fun, fiesta and f...",Unknown,Unknown,Dollars
1,Happy Cow Dairy,"Agriculture, Farming",Seed,584000.0,"Mumbai, Maharashtra, India",A startup which aggregates milk from dairy far...,Unknown,Unknown,Rupees
2,MyLoanCare,"Credit, Financial Services, Lending, Marketplace",Series A,949000.0,"Gurgaon, Haryana, India",Leading Online Loans Marketplace in India,Unknown,Unknown,Rupees
3,PayMe India,"Financial Services, FinTech",Angel,2000000.0,"Noida, Uttar Pradesh, India",PayMe India is an innovative FinTech organizat...,Unknown,Unknown,Dollars
4,Eunimart,"E-Commerce Platforms, Retail, SaaS",Seed,0.0,"Hyderabad, Andhra Pradesh, India",Eunimart is a one stop solution for merchants ...,Unknown,Unknown,Dollars
...,...,...,...,...,...,...,...,...,...
521,Udaan,"B2B, Business Development, Internet, Marketplace",Series C,3285000.0,"Bangalore, Karnataka, India","Udaan is a B2B trade platform, designed specif...",Unknown,Unknown,Rupees
522,Happyeasygo Group,"Tourism, Travel",Series A,0.0,"Haryana, Haryana, India",HappyEasyGo is an online travel domain.,Unknown,Unknown,Dollars
523,Mombay,"Food and Beverage, Food Delivery, Internet",Seed,7500.0,"Mumbai, Maharashtra, India",Mombay is a unique opportunity for housewives ...,Unknown,Unknown,Dollars
524,Droni Tech,Information Technology,Seed,511000.0,"Mumbai, Maharashtra, India",Droni Tech manufacture UAVs and develop softwa...,Unknown,Unknown,Rupees


In [1298]:
# The helper column is no longer needed once the amounts are converted.
# errors='ignore' keeps this cell re-runnable: without it, running the cell a
# second time on the same kernel raises KeyError because the column is already gone.
data_2018.drop(columns='Original Currency', inplace=True, errors='ignore')

In [1299]:
# lets simplify sectors since there are too many of them to deduce meaningful insights

data_2018['Sector'].unique()

array(['Brand Marketing, Event Promotion, Marketing, Sponsorship, Ticketing',
       'Agriculture, Farming',
       'Credit, Financial Services, Lending, Marketplace',
       'Financial Services, FinTech',
       'E-Commerce Platforms, Retail, SaaS',
       'Cloud Infrastructure, PaaS, SaaS',
       'Internet, Leisure, Marketplace', 'Market Research',
       'Information Services, Information Technology', 'Mobile Payments',
       'B2B, Shoes', 'Internet',
       'Apps, Collaboration, Developer Platform, Enterprise Software, Messaging, Productivity Tools, Video Chat',
       'Food Delivery', 'Industrial Automation',
       'Automotive, Search Engine, Service Industry',
       'Finance, Internet, Travel',
       'Accounting, Business Information Systems, Business Travel, Finance, SaaS',
       'Artificial Intelligence, Product Search, SaaS, Service Industry, Software',
       'Internet of Things, Waste Management',
       'Air Transportation, Freight Service, Logistics, Marine Transport

In [1300]:
data_2018['Sector'].isna().sum()

0

In [1301]:
data_2018[data_2018['Sector'] == 'Consumer']


Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does,Founders,Investor
179,Colive.in,Consumer,Seed,1800000.0,"Bangalore, Karnataka, India",A technology powered network of Branded Servic...,Unknown,Unknown


In [1302]:
# Rows whose sector is the '—' placeholder are first marked 'N/A', then every
# 'N/A' sector is overwritten with that row's 'What it does' text.
data_2018.loc[data_2018['Sector'] == '—', 'Sector'] = 'N/A'
condition = (data_2018['Sector'] == 'N/A')
to_be_inputed = data_2018.loc[condition, 'What it does'].values

data_2018.loc[condition, 'Sector'] = to_be_inputed
data_2018

Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does,Founders,Investor
0,TheCollegeFever,"Brand Marketing, Event Promotion, Marketing, S...",Seed,250000.0,"Bangalore, Karnataka, India","TheCollegeFever is a hub for fun, fiesta and f...",Unknown,Unknown
1,Happy Cow Dairy,"Agriculture, Farming",Seed,584000.0,"Mumbai, Maharashtra, India",A startup which aggregates milk from dairy far...,Unknown,Unknown
2,MyLoanCare,"Credit, Financial Services, Lending, Marketplace",Series A,949000.0,"Gurgaon, Haryana, India",Leading Online Loans Marketplace in India,Unknown,Unknown
3,PayMe India,"Financial Services, FinTech",Angel,2000000.0,"Noida, Uttar Pradesh, India",PayMe India is an innovative FinTech organizat...,Unknown,Unknown
4,Eunimart,"E-Commerce Platforms, Retail, SaaS",Seed,0.0,"Hyderabad, Andhra Pradesh, India",Eunimart is a one stop solution for merchants ...,Unknown,Unknown
...,...,...,...,...,...,...,...,...
521,Udaan,"B2B, Business Development, Internet, Marketplace",Series C,3285000.0,"Bangalore, Karnataka, India","Udaan is a B2B trade platform, designed specif...",Unknown,Unknown
522,Happyeasygo Group,"Tourism, Travel",Series A,0.0,"Haryana, Haryana, India",HappyEasyGo is an online travel domain.,Unknown,Unknown
523,Mombay,"Food and Beverage, Food Delivery, Internet",Seed,7500.0,"Mumbai, Maharashtra, India",Mombay is a unique opportunity for housewives ...,Unknown,Unknown
524,Droni Tech,Information Technology,Seed,511000.0,"Mumbai, Maharashtra, India",Droni Tech manufacture UAVs and develop softwa...,Unknown,Unknown


In [1303]:
data_2018['Sector'].unique()

array(['Brand Marketing, Event Promotion, Marketing, Sponsorship, Ticketing',
       'Agriculture, Farming',
       'Credit, Financial Services, Lending, Marketplace',
       'Financial Services, FinTech',
       'E-Commerce Platforms, Retail, SaaS',
       'Cloud Infrastructure, PaaS, SaaS',
       'Internet, Leisure, Marketplace', 'Market Research',
       'Information Services, Information Technology', 'Mobile Payments',
       'B2B, Shoes', 'Internet',
       'Apps, Collaboration, Developer Platform, Enterprise Software, Messaging, Productivity Tools, Video Chat',
       'Food Delivery', 'Industrial Automation',
       'Automotive, Search Engine, Service Industry',
       'Finance, Internet, Travel',
       'Accounting, Business Information Systems, Business Travel, Finance, SaaS',
       'Artificial Intelligence, Product Search, SaaS, Service Industry, Software',
       'Internet of Things, Waste Management',
       'Air Transportation, Freight Service, Logistics, Marine Transport

#### Create a function that pushes sectors matching specific keywords or expressions into a particular list. This will be used to recategorize the sectors

In [1304]:
# Sectors labelled only 'Consumer' are relabelled 'Business Consumer' before the
# redistribution function is called (the original note reports just 2 such
# companies, found on further investigation).

import re

data_2018.loc[data_2018['Sector'] == 'Consumer', 'Sector'] = 'Business Consumer'
known_sectors = data_2018['Sector'].unique()

# One empty bucket per simplified sector; sector_redistribution() fills them
# with the raw sector strings that belong to each.
finance, tech, beauty = [], [], []
education, food, sports = [], [], []
hospitality, commerce, manufacturing = [], [], []
agriculture, health, government = [], [], []
entertainment, business_intelligence, transport = [], [], []
lifestyle, energy, real_estate = [], [], []


def sector_redistribution(known_sectors):
    """Collapse the raw 2018 sector strings into a small set of broad sectors.

    Each raw sector is tested against an ordered list of keyword patterns
    (case-sensitive ``re.search``); the first pattern that matches decides the
    bucket. Raw sectors that match no pattern are left unchanged.

    Parameters
    ----------
    known_sectors : iterable of str
        The distinct raw sector values to classify.

    Side effects
    ------------
    * Appends each classified raw sector to the matching module-level bucket
      list (``finance``, ``tech``, ..., ``real_estate``).
    * Rewrites ``data_2018['Sector']`` with the broad sector labels.

    Changes from the previous version
    ---------------------------------
    * Sectors matching 'Apartment|real estate|Home' now go to ``real_estate``
      (label 'Real Estate'); they used to be appended to ``entertainment``.
    * The column is relabelled once, after classification, instead of running
      18 full-column passes for every sector in the loop.
    * Non-string sectors (e.g. NaN) are skipped instead of raising TypeError.
    """
    # (pattern, bucket list, broad label). Order matters: the first match wins.
    # NOTE(review): some alternatives can never win because an earlier rule
    # catches them first, e.g. 'Industrial Automation' (manufacturing) is
    # shadowed by 'Industrial' (agriculture). Patterns are kept as they were.
    rules = [
        ('Bank|Fintech|Financial|Crypto|Account|Credit|Block|Crowd|Lending|Trading Platform|Wealth Management|Insurance|finance|credit|insurance|remittance|money|wealth',
         finance, 'Finance'),
        ('Automotive|Air Transportation|Logistics|Autonomous Vehicle|Vehicle|Transportation|Delivery|Rental|vehicles|Tyre|fleet|Wheels',
         transport, 'Transport'),
        ('Clean Energy|Energy', energy, 'Energy'),
        ('Analytics|Consulting|Human|Career|ERP|Advertising|Market Research|business ',
         business_intelligence, 'Business Intelligence'),
        ('Intelligence|Tech|Crypto|Cloud|Artificial|Data|net|Things|Apps|droid|Software|Computer|Mobile|3D Printing|Funding Platform|Applications|File|Embedded Systems|Online Portals|Fraud Detection|Search Engine|Nanotechnology|security|AI',
         tech, 'Technology'),
        ('Beauty|Cosmetic|Fashion|Eyewear|cosmetics ', beauty, 'Beauty'),
        ('Decor|Fitness|Training|Wellness', lifestyle, 'Lifestyle'),
        ('Edutech|education|Learn|Children|Child Care|Collaboration', education, 'Education'),
        ('Food|Bev|Catering|tering|Cook|food', food, 'Food & Beverages'),
        ('Sports|eSports|Fantasy Sports|Games|ball', sports, 'Sports'),
        ('Customer|Service|Hospital|Tourism|Events|Wedding|Travel|hosts|booking',
         hospitality, 'Hospitality'),
        ('B2B|trade|enterpise|Commerce|commerce|Business|Commercial|Consumer Goods|Marketplace|Business Consumer|Marketing|Retail',
         commerce, 'Commerce'),
        ('Dental|Health|Health Insurance|Medic|Supplement|Biopharma|Veterinary', health, 'Health'),
        ('Agric|agric|Biotechnology|Industrial|Farming', agriculture, 'Agriculture'),
        ('Battery|Manufacturing|Electronics|Industrial Automation|Aerospace|conductor|gaming',
         manufacturing, 'Manufacturing'),
        ('Communities|Smart Cities|Government|Classifieds', government, 'Government'),
        ('Media|Dating|Music|News|Audio|Gaming|Creative|Entertainment|Broadcasting',
         entertainment, 'Entertainment'),
        ('Apartment|real estate|Home', real_estate, 'Real Estate'),
    ]

    relabel = {}
    for sector in known_sectors:
        if not isinstance(sector, str):
            # re.search cannot handle NaN/None; leave such values untouched.
            continue
        for pattern, bucket, label in rules:
            if re.search(pattern, sector):
                bucket.append(sector)
                relabel[sector] = label
                break

    # Single pass over the column; unmatched values fall through unchanged.
    data_2018['Sector'] = data_2018['Sector'].apply(lambda value: relabel.get(value, value))
       

sector_redistribution(known_sectors)


In [1306]:
data_2018[data_2018['Sector'] == 'N/A'].shape

(0, 8)

In [1307]:
data_2018['Sector'].unique()

array(['Commerce', 'Agriculture', 'Finance', 'Technology',
       'Business Intelligence', 'Transport', 'Food & Beverages',
       'Education', 'Beauty', 'Energy', 'Lifestyle', 'Hospitality',
       'Entertainment', 'Health', 'Sports', 'Government', 'Manufacturing'],
      dtype=object)

In [1308]:
data_2018['Sector'].unique().shape

(17,)

### Creating a function that removes everything after the first comma in the HeadQuarter column, keeping only the first part (the city)

In [1309]:
def remove_excess_headquaters(string):
    """Return the part of a location string that precedes its first comma.

    Parameters
    ----------
    string : str or any
        A location such as 'Bangalore, Karnataka, India'.

    Returns
    -------
    The text before the first comma ('Bangalore' for the example above).
    A string without a comma is returned unchanged; previously such values
    came back as None because the return sat inside the comma check.
    Non-string values (None, NaN) are returned as they are instead of
    raising TypeError.
    """
    if not isinstance(string, str):
        return string
    # split(',', 1) stops at the first comma; no whitespace is trimmed, so the
    # result for comma-containing input is the same as before.
    return string.split(',', 1)[0]
    
data_2018['HeadQuarter'] = data_2018['HeadQuarter'].apply(remove_excess_headquaters)
data_2018.head()

Unnamed: 0,Company/Brand,Sector,Stage,Amount($),HeadQuarter,What it does,Founders,Investor
0,TheCollegeFever,Commerce,Seed,250000.0,Bangalore,"TheCollegeFever is a hub for fun, fiesta and f...",Unknown,Unknown
1,Happy Cow Dairy,Agriculture,Seed,584000.0,Mumbai,A startup which aggregates milk from dairy far...,Unknown,Unknown
2,MyLoanCare,Finance,Series A,949000.0,Gurgaon,Leading Online Loans Marketplace in India,Unknown,Unknown
3,PayMe India,Finance,Angel,2000000.0,Noida,PayMe India is an innovative FinTech organizat...,Unknown,Unknown
4,Eunimart,Commerce,Seed,0.0,Hyderabad,Eunimart is a one stop solution for merchants ...,Unknown,Unknown


In [1310]:
# data_2019['Amount($)'] = data_2019['Amount($)'].apply(lambda x: str(x).replace('$', ""))
# data_2019['Amount($)'] = data_2019['Amount($)'].apply(lambda x: str(x).replace('Undisclosed', "0"))
# data_2019['Amount($)'] = data_2019['Amount($)'].apply(lambda x: str(x).replace(',', ""))
# data_2019['Amount($)'] = data_2019['Amount($)'].astype(float)
# data_2019.info()


In [1311]:
# data_2020['Amount($)'] = data_2020['Amount($)'].apply(lambda x: str(x).replace('$', ""))
# data_2020['Amount($)'] = data_2020['Amount($)'].apply(lambda x: str(x).replace('Undisclosed', "0"))
# data_2020['Amount($)'] = data_2020['Amount($)'].apply(lambda x: str(x).replace(',', ""))
# data_2020['Amount($)'] = data_2020['Amount($)'].apply(lambda x: str(x).replace('nan', "0"))
# data_2020['Amount($)'] = data_2020['Amount($)'].apply(lambda x: str(x).replace('', "0"))
# data_2020['Amount($)'] = data_2020['Amount($)'].astype(float)
# data_2020.info()