# Number of Fundings

In [2]:
from collections import Counter
import pandas as pd
# Count how many funding rounds fall in each year and print them in
# ascending year order, one "<year> <count>" pair per line.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Date components may be separated by '/' or '.', so both are normalised to
# '.' before splitting; the year is taken as the last component.
# The original Date column is left untouched.
data['Year'] = (
    data['Date']
    .str.replace('/', '.')
    .str.split('.')
    .str[-1]
    .astype(int)
)

rounds_per_year = Counter(data['Year'])

for year, n_rounds in sorted(rounds_per_year.items()):
    print(year, n_rounds)

2015 936
2016 993
2017 443


# Top Indian Cities

In [1]:
from collections import Counter
import pandas as pd
import operator
# Rank cities by number of funding rounds and print the ten most frequent,
# one "<City Name> <count>" pair per line.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Spelling variants mapped to one canonical (lower-case) city name.
city_aliases = {'delhi': 'new delhi'}

cities = (
    data['CityLocation']
    .fillna('None')
    .str.lower()
    # Keep only the text before the first '/'. partition() returns a
    # three-column frame (head, separator, tail), so the head column has to
    # be selected explicitly before it can be used as a single column.
    .str.partition('/')[0]
    .str.strip()
    .replace(city_aliases)
)

city_counts = Counter(cities)
# Rows without a city were filled with 'None' (lower-cased to 'none') above.
# Counter's del does not raise when the key is absent.
del city_counts['none']

# most_common(10) == the ten largest counts, ties kept in first-seen order.
for city, n_rounds in city_counts.most_common(10):
    # 'new delhi' -> 'New Delhi'
    display_name = ' '.join(word.capitalize() for word in city.split())
    print(display_name, n_rounds)


Bangalore 635
Mumbai 449
New Delhi 389
Gurgaon 241
Pune 91
Noida 79
Hyderabad 77
Chennai 67
Ahmedabad 35
Jaipur 25


# Funding amount

In [13]:
from collections import Counter
import pandas as pd
import operator
# For the ten cities with the largest total funding, print each city's share
# (in percent) of the combined funding of those ten cities.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Amounts are handled as strings containing ','; missing amounts count as 0.
data['AmountInUSD'] = (
    data['AmountInUSD']
    .fillna('0')
    .str.replace(',', '')
    .astype(int)
)

# Delhi -> New Delhi
city_aliases = {'delhi': 'new delhi'}

# 'Bangalore', 'bangalore / us' -> 'bangalore'
data['CityLocation'] = (
    data['CityLocation']
    .fillna('None')
    .str.lower()
    # partition() returns a three-column frame (head, separator, tail);
    # only the head column is a valid single-column replacement.
    .str.partition('/')[0]
    .str.strip()
    .replace(city_aliases)
)

# Aggregate the amount column only: summing the whole frame would also try
# to aggregate the text columns, which are not needed here.
funding_by_city = data.groupby('CityLocation')['AmountInUSD'].sum()

# Rows without a city were filled with 'None' (lower-cased to 'none') above.
funding_by_city = funding_by_city.drop('none', errors='ignore')

# Top ten cities and the total they are measured against.
top10 = funding_by_city.sort_values(ascending=False)[:10]
top10_total = top10.sum()

for city, amount in top10.items():
    # 'new delhi' -> 'New Delhi'
    display_name = ' '.join(word.capitalize() for word in city.split())
    share = (amount / top10_total) * 100
    print('{} {:.2f}'.format(display_name, share))

Bangalore 49.71
New Delhi 16.63
Mumbai 13.90
Gurgaon 12.21
Chennai 2.43
Pune 2.16
Hyderabad 1.15
Noida 1.01
Ahmedabad 0.58
Jaipur 0.21


# Investment Type

In [41]:
from collections import Counter
import pandas as pd
import operator
# Print, for every investment type, its share (in percent) of the total
# funded amount across all rows.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Fill the gaps so the string operations below see text in every row.
data['AmountInUSD'] = data['AmountInUSD'].fillna('0,0')
data['InvestmentType'] = data['InvestmentType'].fillna('None')

# Remove the ',' characters from the amounts, then convert to integers.
data['AmountInUSD'] = data['AmountInUSD'].str.replace(',', '').astype(int)

# Lower-casing and removing spaces collapses spelling variants of a type;
# the mapping then restores a readable label for the known types.
rep = {
    'privateequity': 'Private Equity',
    'seedfunding': 'Seed Funding',
    'debtfunding': 'Debt Funding',
    'crowdfunding': 'Crowd Funding',
}
data['InvestmentType'] = (
    data['InvestmentType']
    .str.lower()
    .str.replace(' ', '')
    .replace(rep)
)

# Denominator: every row counts, including rows without an investment type.
totalinvestment = data['AmountInUSD'].sum()

# One grouped sum gives the amount for every type at once.
amount_by_type = data.groupby('InvestmentType')['AmountInUSD'].sum()

# The Counter supplies the types in first-seen order; rows that had no type
# ('none' after lower-casing) are left out of the report.
investment_dict = Counter(data['InvestmentType'])
del investment_dict['none']

for key in investment_dict:
    investment_dict[key] = (amount_by_type[key] / totalinvestment) * 100
    print("{} {:.2f}".format(key, investment_dict[key]))
    

Private Equity 98.15
Seed Funding 1.81
Debt Funding 0.04
Crowd Funding 0.00


# Top Industries

In [8]:
from collections import Counter
import pandas as pd
import operator
# Exploration step: show every distinct industry vertical, sorted, so that
# spelling variants of the same vertical can be spotted.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Missing amounts get the '0,0' placeholder; every other gap becomes 'None'.
data['AmountInUSD'] = data['AmountInUSD'].fillna('0,0')
data = data.fillna('None')

# Applied after lower-casing, so the keys are lower-case spellings.
rep = {'ecommerce': 'Ecommerce', 'consumer interne': 'consumer internet'}

data['IndustryVertical'] = data['IndustryVertical'].str.lower().replace(rep)

# Distinct values, sorted; as the last expression this is the cell's output.
sorted(set(data['IndustryVertical']))

['360-degree view creating platform',
 '3d printer manufacturer',
 'Ecommerce',
 'activity based social network',
 'advertising & marketing community networking platform',
 'affordable education',
 'affordable hotel booking online',
 'affordable personal healthcare products',
 'algorithmic match making platform',
 'alternate mobile monetization platform',
 'anonymous bulletin board app',
 'api workflow platform',
 'app analytics platform',
 'app based bus pooling services',
 'app based fitness coaching',
 'app security\xa0 testing platform',
 'architectural design & consulting',
 'artificial intelligence ecommerce chatbot',
 'artificial intelligence platform',
 'artist / designer marketplace',
 'asset financing platform',
 'auto',
 'auto insurance online platform',
 'auto rickshaw based logistics',
 'auto rickshaw based services',
 'automated storage & warehousing solution',
 'automotive services platform',
 'autorickshaw aggregator & booking platform',
 'b2b ecommerce marketplace',
 '

# Top Investor

In [75]:
from collections import Counter
import pandas as pd
import operator
# Exploration step: count how often each raw InvestorsName string occurs
# (a cell listing several investors is counted as one string).
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Missing amounts get the '0,0' placeholder; every other gap becomes 'None'.
data['AmountInUSD'] = data['AmountInUSD'].fillna('0,0')

# Fill the remaining gaps and order the rows by investor string in one go.
data = data.fillna('None').sort_values('InvestorsName')

# As the last expression, the Counter is the cell's displayed output.
Counter(data['InvestorsName'])

Counter({'1Crowd': 1,
         '1Crowd (through crowd funding)': 1,
         '1Crowd (through crowdfunding)': 1,
         '1Crowd, Eureka Forbes Ltd, Shapoorji Pallonji & Co. Ltd.': 1,
         '3 undisclosed HNIs': 1,
         '3 undisclosed investors': 1,
         '3One4 Capital': 1,
         '3one4 Capital, Mumbai Angels, Aarin Capital': 1,
         '3one4 Capital, Tracxn Labs, Aaruha Technology Fund, Endiya Partners': 1,
         '3one4 capital': 1,
         '500 Startups': 3,
         '500 Startups, IDG Ventures & Advantedge fund, Neeraj Arora, Leon Seynave': 1,
         '500 Startups, IvyCap Ventures': 1,
         '500 Startups, Littlerock, Singularity Ventures': 1,
         '500 Startups, Mato Peric & Others': 1,
         '500 Startups, Mato Peric, TracxnLabs': 1,
         '500 Startups, Purvi Capital, Rajan Anandan, Abhishek Gupta': 1,
         '500 Startups, Smile Multimedia, Kunal Bahl, Rohit Bansal, Girish Matrubootham': 1,
         '500 Startups, TV Mohandas Pai, Tandem Cap

# Top Industries

In [76]:
from collections import Counter
import pandas as pd
import operator
# For the five industry verticals with the largest total funding, print each
# vertical's share (in percent) of the combined funding of those five.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Amounts are handled as strings containing ','; missing amounts count as 0.
data['AmountInUSD'] = (
    data['AmountInUSD']
    .fillna('0')
    .str.replace(',', '')
    .astype(int)
)
data['IndustryVertical'] = data['IndustryVertical'].fillna('None')

# Put every case variant of "ecommerce" under one label. .loc is used
# because many rows are updated at once; .at addresses a single cell only.
is_ecommerce = data['IndustryVertical'].str.lower() == 'ecommerce'
data.loc[is_ecommerce, 'IndustryVertical'] = 'Ecommerce'

funding_by_industry = (
    # Aggregate the amount column only; the text columns are not needed.
    data.groupby('IndustryVertical')['AmountInUSD']
    .sum()
    # Rows without a vertical were filled with 'None' above.
    .drop('None', errors='ignore')
    .sort_values(ascending=False)
)

top5 = funding_by_industry[:5]
top5_total = top5.sum()

for industry, amount in top5.items():
    print("{} {:.2f}".format(industry, (amount * 100) / top5_total))

Ecommerce 40.53
Consumer Internet 35.95
Technology 10.45
Online Marketplace 6.63
E-Commerce & M-Commerce platform 6.44


# Top startups

In [96]:
from collections import Counter
import pandas as pd
import operator
# Print the names of the five startups with the largest total funding,
# largest first.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Amounts are handled as strings containing ','; missing amounts count as 0.
data['AmountInUSD'] = (
    data['AmountInUSD']
    .fillna('0')
    .str.replace(',', '')
    .astype(int)
)

# Different spellings of the same startup, mapped to one canonical name.
name_aliases = {
    'Ola Cabs': 'Ola', 'Olacabs': 'Ola',
    'Paytm Marketplace': 'Paytm',
    'Flipkart.com': 'Flipkart',
    'OyoRooms': 'Oyo', 'Oyo Rooms': 'Oyo', 'OYO Rooms': 'Oyo', 'Oyorooms': 'Oyo',
}

# Apply the aliases to the name column only: a frame-wide replace would also
# rewrite identical strings that happen to occur in unrelated columns.
data['StartupName'] = data['StartupName'].fillna('None').replace(name_aliases)

funding_by_startup = (
    # Aggregate the amount column only; the text columns are not needed.
    data.groupby('StartupName')['AmountInUSD']
    .sum()
    .sort_values(ascending=False)
)

for startup in funding_by_startup.index[:5]:
    print(startup)

Paytm
Flipkart
Ola
Snapdeal
Oyo


# Funding Rounds

In [103]:
from collections import Counter
import pandas as pd
import operator
# Print the five startups that appear in the most funding rounds, as
# "<name> <number of rounds>", most rounds first.
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Different spellings of the same startup, mapped to one canonical name.
name_aliases = {
    'Ola Cabs': 'Ola', 'Olacabs': 'Ola',
    'Paytm Marketplace': 'Paytm',
    'Flipkart.com': 'Flipkart',
    'OyoRooms': 'Oyo', 'Oyo Rooms': 'Oyo', 'OYO Rooms': 'Oyo', 'Oyorooms': 'Oyo',
}

# Only the name column matters for a row count, so the amounts are not
# parsed here and the aliases are applied to that column alone.
startup_names = data['StartupName'].fillna('None').replace(name_aliases)

# most_common(5) == the five largest counts, ties kept in first-seen order.
for startup, n_rounds in Counter(startup_names).most_common(5):
    print(startup, n_rounds)

Ola 9
Swiggy 7
UrbanClap 6
Paytm 6
Oyo 6


# Top Investor

In [146]:
from collections import Counter
import pandas as pd
import numpy as np
import operator

# Print the investor that takes part in the most funding rounds, as
# "<name> <number of rounds>".
data = pd.read_csv('startup_funding.csv', skipinitialspace=True)

# Spellings used when the investor is not disclosed; a cell consisting of
# exactly one of these is folded into a single 'None' bucket.
rep = {'Undisclosed Investors': 'None', 'Undisclosed investors': 'None', 'Undisclosed Investor': 'None',
       'Undisclosed investor': 'None', 'Undisclosed': 'None'}

# Rows with no investor recorded carry no name to count, so they are dropped.
investor_cells = data['InvestorsName'].dropna().replace(rep)

# One cell can list several investors separated by ','. The cells are
# flattened with plain Python: the per-row lists have different lengths and
# therefore cannot be packed into a regular NumPy array.
investor_names = []
for cell in investor_cells:
    for name in cell.split(','):
        name = name.strip(' ')
        if name:  # a trailing or doubled ',' yields an empty name
            investor_names.append(name)

investors = Counter(investor_names)

# NOTE(review): this replaces a positional skip of the top-ranked entry with
# an explicit removal of the placeholder bucket. It assumes the skipped entry
# was the 'None' bucket (or an empty name) - confirm against the data.
del investors['None']

top_investor = investors.most_common(1)
if top_investor:
    print(top_investor[0][0], top_investor[0][1])

Sequoia Capital 64
