In [1]:
# Suppress warnings
# NOTE(review): filterwarnings('ignore') silences every warning category for the
# rest of the session, including any warnings pandas raises in later cells --
# confirm that hiding those is intended.

import warnings
warnings.filterwarnings('ignore')

In [3]:
# Import the pandas package (the only third-party library this notebook uses)

import pandas as pd

# Checkpoint 1: Data Cleaning

In [4]:
# Load the companies and rounds2 data sets into their respective DataFrames.
# companies.txt is tab-separated. The separator is the two-character regular
# expression r"\t" (the same string as the previous "\\t" literal). pandas only
# handles regex separators in its Python parsing engine, so that engine is
# requested explicitly instead of being reached through a fallback whose
# warning the notebook-wide warnings filter would hide.

companies = pd.read_csv("companies.txt", sep=r"\t", engine="python")
rounds2 = pd.read_csv("rounds2.csv", encoding="ISO-8859-1")

In [5]:
# Data cleaning: strip every non-ASCII character from the company keys
# (companies.permalink and rounds2.company_permalink) and lower-case the key
# values so the two frames can be matched on them.
# The vectorised .str accessor replaces DataFrame.applymap + lambda: it passes
# missing values through instead of raising AttributeError on NaN, and it does
# not rely on applymap, which newer pandas releases deprecate.

rounds2['company_permalink'] = (
    rounds2['company_permalink']
    .str.encode('utf-8')
    .str.decode('ascii', errors='ignore')  # drop bytes that are not ASCII
    .str.lower()
)
companies['permalink'] = (
    companies['permalink']
    .str.encode('utf-8')
    .str.decode('ascii', errors='ignore')  # drop bytes that are not ASCII
    .str.lower()
)


In [6]:
# Remove double quotes from the key columns of rounds2 (company_permalink)
# and companies (permalink).

for frame, key_col in ((rounds2, 'company_permalink'), (companies, 'permalink')):
    # Literal (non-regex) replacement of the quote character.
    frame[key_col] = frame[key_col].str.replace('"', '', regex=False)

### Question: How many unique companies are present in rounds2?

In [7]:
# Number of distinct company keys referenced by the funding rounds.
print(len(rounds2['company_permalink'].unique()))

66368


### Question: How many unique companies are present in companies?

In [9]:
# Number of distinct company keys in the companies table.
print(len(companies['permalink'].unique()))

66368


### Question: In the companies data frame, which column can be used as the unique key for each company? Write the name of the column.

In [10]:
## Permalink column in Company Dataframe is unique for each company

### Question: Are there any companies in the rounds2 file which are not present in companies? Answer yes or no: Y/N

In [11]:
# List the rounds2 rows whose company_permalink has no match in companies.permalink
rounds2[~rounds2.company_permalink.isin(companies.permalink)]
# Answer: N (the selection above returns no rows)

Unnamed: 0,company_permalink,funding_round_permalink,funding_round_type,funding_round_code,funded_at,raised_amount_usd


### Merge the two data frames so that all variables (columns) in the companies frame are added to the rounds2 data frame. Name the merged frame master_frame. How many observations are present in master_frame?


In [12]:
# Left-join the company attributes onto every funding round, then drop the
# duplicate key column contributed by companies.
master_frame = (
    rounds2
    .merge(companies, how="left", left_on='company_permalink', right_on='permalink')
    .drop(columns='permalink')
)
master_frame

Unnamed: 0,company_permalink,funding_round_permalink,funding_round_type,funding_round_code,funded_at,raised_amount_usd,name,homepage_url,category_list,status,country_code,state_code,region,city,founded_at
0,/organization/-fame,/funding-round/9a01d05418af9f794eebff7ace91f638,venture,B,05-01-2015,10000000.0,#fame,http://livfame.com,Media,operating,IND,16,Mumbai,Mumbai,
1,/organization/-qounter,/funding-round/22dacff496eb7acb2b901dec1dfe5633,venture,A,14-10-2014,,:Qounter,http://www.qounter.com,Application Platforms|Real Time|Social Network...,operating,USA,DE,DE - Other,Delaware City,04-09-2014
2,/organization/-qounter,/funding-round/b44fbb94153f6cdef13083530bb48030,seed,,01-03-2014,700000.0,:Qounter,http://www.qounter.com,Application Platforms|Real Time|Social Network...,operating,USA,DE,DE - Other,Delaware City,04-09-2014
3,/organization/-the-one-of-them-inc-,/funding-round/650b8f704416801069bb178a1418776b,venture,B,30-01-2014,3406878.0,"""(THE) ONE of THEM,Inc.""",http://oneofthem.jp,Apps|Games|Mobile,operating,,,,,
4,/organization/0-6-com,/funding-round/5727accaeaa57461bd22a9bdd945382d,venture,A,19-03-2008,2000000.0,0-6.com,http://www.0-6.com,Curated Web,operating,CHN,22,Beijing,Beijing,01-01-2007
5,/organization/004-technologies,/funding-round/1278dd4e6a37fa4b7d7e06c21b3c1830,venture,,24-07-2014,,004 Technologies,http://004gmbh.de/en/004-interact,Software,operating,USA,IL,"""Springfield, Illinois""",Champaign,01-01-2010
6,/organization/01games-technology,/funding-round/7d53696f2b4f607a2f2a8cbb83d01839,undisclosed,,01-07-2014,41250.0,01Games Technology,http://www.01games.hk/,Games,operating,HKG,,Hong Kong,Hong Kong,
7,/organization/0ndine-biomedical-inc,/funding-round/2b9d3ac293d5cdccbecff5c8cb0f327d,seed,,11-09-2009,43360.0,Ondine Biomedical Inc.,http://ondinebio.com,Biotechnology,operating,CAN,BC,Vancouver,Vancouver,01-01-1997
8,/organization/0ndine-biomedical-inc,/funding-round/954b9499724b946ad8c396a57a5f3b72,venture,,21-12-2009,719491.0,Ondine Biomedical Inc.,http://ondinebio.com,Biotechnology,operating,CAN,BC,Vancouver,Vancouver,01-01-1997
9,/organization/0xdata,/funding-round/383a9bd2c04f7038bb543ccef5ba3eae,seed,,22-05-2013,3000000.0,H2O.ai,http://h2o.ai/,Analytics,operating,USA,CA,SF Bay Area,Mountain View,01-01-2011


# Checkpoint 2: Funding Type Analysis

In [13]:
# Remove rows with a missing raised_amount_usd, then strip double quotes from
# the company name.
master_frame = master_frame.dropna(subset=['raised_amount_usd'])
master_frame['name'] = master_frame['name'].str.replace('"', '', regex=False)

### Question: Average funding amount of venture type?

In [14]:
# Venture rounds only. The selection is copied because later cells add and
# overwrite columns on `venture`; without the copy those assignments target a
# slice of master_frame (a chained-assignment hazard whose warning is hidden by
# the notebook-wide warnings filter).
venture = master_frame.loc[master_frame['funding_round_type'] == 'venture'].copy()

# Mean amount raised per venture round, rounded to two decimals.
venture_avg = round(venture['raised_amount_usd'].mean(), 2)
print(venture_avg)

11748949.13


### Question: Average funding amount of angel type?

In [15]:
# Angel rounds and their mean raised amount, rounded to two decimals.
angel = master_frame[master_frame['funding_round_type'].eq('angel')]
angel_avg = round(angel['raised_amount_usd'].mean(), 2)
print(angel_avg)

958694.47


### Question:  Average funding amount of seed type?

In [16]:
# Seed rounds and their mean raised amount, rounded to two decimals.
seed = master_frame[master_frame['funding_round_type'].eq('seed')]
seed_avg = round(seed['raised_amount_usd'].mean(), 2)
print(seed_avg)

719818.0


### Question:  Average funding amount of private equity type?

In [67]:
# Private-equity rounds and their mean raised amount, rounded to two decimals.
private = master_frame[master_frame['funding_round_type'].eq('private_equity')]
private_avg = round(private['raised_amount_usd'].mean(), 2)
print(private_avg)

73308593.03


### Question: Considering that Spark Funds wants to invest between 5 to 15 million USD per investment round, which investment type is the most suitable for it?

In [17]:
### Of the venture, angel, seed and private-equity round types, venture is the only one
### whose average round size (~11.75 million USD) falls inside the 5-15 million USD target range.
### Answer: Venture

# Checkpoint 3 : Country Analysis

### Top nine countries which have received the highest total funding across ALL sectors for the chosen investment type - Venture

In [18]:
# Total venture funding per country, largest first.
# Only raised_amount_usd is aggregated: summing the whole frame would also try
# to "sum" the text columns, which newer pandas releases do by concatenating
# strings instead of silently dropping them.
ven = (
    venture
    .groupby('country_code', as_index=False)['raised_amount_usd']
    .sum()
    .sort_values(by='raised_amount_usd', ascending=False)
)

# The nine countries with the highest total venture funding.
top9 = ven.head(9)
top9

Unnamed: 0,country_code,raised_amount_usd
94,USA,422510800000.0
15,CHN,39835420000.0
29,GBR,20245630000.0
39,IND,14391860000.0
12,CAN,9583332000.0
28,FRA,7259537000.0
42,ISR,6907515000.0
21,DEU,6346960000.0
45,JPN,3363677000.0


### Top 3 English speaking countries

In [19]:
#1. Top English-speaking country:  USA
#2. Second English-speaking country: GBR
#3. Third English-speaking country: IND

# Checkpoint 4: Sector Analysis

In [20]:
## Load the category -> main-sector mapping table from mapping.csv
mapping = pd.read_csv(
    "mapping.csv",
    encoding="ISO-8859-1",
)

In [21]:
## Reshape the wide mapping table to long form (one row per category/sector
## pair) and keep only the pairs flagged with value 1.
mapping1 = mapping.melt(id_vars=['category_list'], var_name='main_sector')
mapping1 = mapping1[mapping1['value'] == 1]
mapping1

Unnamed: 0,category_list,main_sector,value
8,Adventure Travel,Automotive & Sports,1
14,Aerospace,Automotive & Sports,1
45,Auto,Automotive & Sports,1
46,Automated Kiosk,Automotive & Sports,1
47,Automotive,Automotive & Sports,1
57,Bicycles,Automotive & Sports,1
69,Boating Industry,Automotive & Sports,1
87,CAD,Automotive & Sports,1
93,Cars,Automotive & Sports,1
188,Design,Automotive & Sports,1


In [22]:
# Clean the long-form mapping table.
# * Drop the 'value' column, which is no longer needed after the filter on
#   value == 1. The drop rebinds mapping1 and ignores a missing column, so the
#   cell can be re-run without raising KeyError.
# * Replace '0' with 'na' in category_list: per the original author's note,
#   several category names are misspelled with the same '0'-for-'na' pattern.
# * That first replacement also turns a genuine '2.0' into '2.na', so it is
#   restored afterwards.
# Both replacements are literal (regex=False); previously the '.' in '2.na'
# could be interpreted as a regex wildcard depending on the pandas version.

mapping1 = mapping1.drop(columns='value', errors='ignore')

mapping1['category_list'] = (
    mapping1['category_list']
    .str.replace('0', 'na', regex=False)
    .str.replace('2.na', '2.0', regex=False)
)


In [23]:
## The primary sector is the first entry of the '|'-separated category_list.
venture['primary_sector'] = venture['category_list'].str.split('|', n=1).str.get(0)
venture

Unnamed: 0,company_permalink,funding_round_permalink,funding_round_type,funding_round_code,funded_at,raised_amount_usd,name,homepage_url,category_list,status,country_code,state_code,region,city,founded_at,primary_sector
0,/organization/-fame,/funding-round/9a01d05418af9f794eebff7ace91f638,venture,B,05-01-2015,10000000.0,#fame,http://livfame.com,Media,operating,IND,16,Mumbai,Mumbai,,Media
3,/organization/-the-one-of-them-inc-,/funding-round/650b8f704416801069bb178a1418776b,venture,B,30-01-2014,3406878.0,"(THE) ONE of THEM,Inc.",http://oneofthem.jp,Apps|Games|Mobile,operating,,,,,,Apps
4,/organization/0-6-com,/funding-round/5727accaeaa57461bd22a9bdd945382d,venture,A,19-03-2008,2000000.0,0-6.com,http://www.0-6.com,Curated Web,operating,CHN,22,Beijing,Beijing,01-01-2007,Curated Web
8,/organization/0ndine-biomedical-inc,/funding-round/954b9499724b946ad8c396a57a5f3b72,venture,,21-12-2009,719491.0,Ondine Biomedical Inc.,http://ondinebio.com,Biotechnology,operating,CAN,BC,Vancouver,Vancouver,01-01-1997,Biotechnology
10,/organization/0xdata,/funding-round/3bb2ee4a2d89251a10aaa735b1180e44,venture,B,09-11-2015,20000000.0,H2O.ai,http://h2o.ai/,Analytics,operating,USA,CA,SF Bay Area,Mountain View,01-01-2011,Analytics
11,/organization/0xdata,/funding-round/ae2a174c06517c2394aed45006322a7e,venture,,03-01-2013,1700000.0,H2O.ai,http://h2o.ai/,Analytics,operating,USA,CA,SF Bay Area,Mountain View,01-01-2011,Analytics
12,/organization/0xdata,/funding-round/e1cfcbe1bdf4c70277c5f29a3482f24e,venture,A,19-07-2014,8900000.0,H2O.ai,http://h2o.ai/,Analytics,operating,USA,CA,SF Bay Area,Mountain View,01-01-2011,Analytics
22,/organization/1-mainstream,/funding-round/b952cbaf401f310927430c97b68162ea,venture,,17-03-2015,5000000.0,1 Mainstream,http://www.1mainstream.com,Apps|Cable|Distribution|Software,acquired,USA,CA,SF Bay Area,Cupertino,01-03-2012,Apps
28,/organization/10-minutes-with,/funding-round/0faccbbcc5818dc5326469f13f5a8ac8,venture,A,09-10-2014,4000000.0,10 Minutes With,http://10minuteswith.com,Education,operating,GBR,H9,London,London,01-01-2013,Education
34,/organization/1000memories,/funding-round/502bd0e50c27616995e4bdad24605ef8,venture,A,16-02-2011,2520000.0,1000memories,http://1000memories.com,Curated Web,acquired,USA,CA,SF Bay Area,San Francisco,01-07-2010,Curated Web


In [24]:
## Lower-case both merge keys so the join below is case-insensitive.
venture['primary_sector'] = venture['primary_sector'].str.lower()
mapping1['category_list'] = mapping1['category_list'].str.lower()


In [25]:
# Attach the main sector to every venture round by matching its primary sector
# against the mapping table (left join keeps every round).
venture_sector = venture.merge(
    mapping1,
    how="left",
    left_on='primary_sector',
    right_on='category_list',
)
venture_sector

Unnamed: 0,company_permalink,funding_round_permalink,funding_round_type,funding_round_code,funded_at,raised_amount_usd,name,homepage_url,category_list_x,status,country_code,state_code,region,city,founded_at,primary_sector,category_list_y,main_sector
0,/organization/-fame,/funding-round/9a01d05418af9f794eebff7ace91f638,venture,B,05-01-2015,10000000.0,#fame,http://livfame.com,Media,operating,IND,16,Mumbai,Mumbai,,media,media,Entertainment
1,/organization/-the-one-of-them-inc-,/funding-round/650b8f704416801069bb178a1418776b,venture,B,30-01-2014,3406878.0,"(THE) ONE of THEM,Inc.",http://oneofthem.jp,Apps|Games|Mobile,operating,,,,,,apps,apps,"News, Search and Messaging"
2,/organization/0-6-com,/funding-round/5727accaeaa57461bd22a9bdd945382d,venture,A,19-03-2008,2000000.0,0-6.com,http://www.0-6.com,Curated Web,operating,CHN,22,Beijing,Beijing,01-01-2007,curated web,curated web,"News, Search and Messaging"
3,/organization/0ndine-biomedical-inc,/funding-round/954b9499724b946ad8c396a57a5f3b72,venture,,21-12-2009,719491.0,Ondine Biomedical Inc.,http://ondinebio.com,Biotechnology,operating,CAN,BC,Vancouver,Vancouver,01-01-1997,biotechnology,biotechnology,Cleantech / Semiconductors
4,/organization/0xdata,/funding-round/3bb2ee4a2d89251a10aaa735b1180e44,venture,B,09-11-2015,20000000.0,H2O.ai,http://h2o.ai/,Analytics,operating,USA,CA,SF Bay Area,Mountain View,01-01-2011,analytics,analytics,"Social, Finance, Analytics, Advertising"
5,/organization/0xdata,/funding-round/ae2a174c06517c2394aed45006322a7e,venture,,03-01-2013,1700000.0,H2O.ai,http://h2o.ai/,Analytics,operating,USA,CA,SF Bay Area,Mountain View,01-01-2011,analytics,analytics,"Social, Finance, Analytics, Advertising"
6,/organization/0xdata,/funding-round/e1cfcbe1bdf4c70277c5f29a3482f24e,venture,A,19-07-2014,8900000.0,H2O.ai,http://h2o.ai/,Analytics,operating,USA,CA,SF Bay Area,Mountain View,01-01-2011,analytics,analytics,"Social, Finance, Analytics, Advertising"
7,/organization/1-mainstream,/funding-round/b952cbaf401f310927430c97b68162ea,venture,,17-03-2015,5000000.0,1 Mainstream,http://www.1mainstream.com,Apps|Cable|Distribution|Software,acquired,USA,CA,SF Bay Area,Cupertino,01-03-2012,apps,apps,"News, Search and Messaging"
8,/organization/10-minutes-with,/funding-round/0faccbbcc5818dc5326469f13f5a8ac8,venture,A,09-10-2014,4000000.0,10 Minutes With,http://10minuteswith.com,Education,operating,GBR,H9,London,London,01-01-2013,education,education,Others
9,/organization/1000memories,/funding-round/502bd0e50c27616995e4bdad24605ef8,venture,A,16-02-2011,2520000.0,1000memories,http://1000memories.com,Curated Web,acquired,USA,CA,SF Bay Area,San Francisco,01-07-2010,curated web,curated web,"News, Search and Messaging"


# Checkpoint 5: Sector Analysis 2

In [26]:
# Build D1, D2 and D3: the venture investments of the top three countries
# (USA, GBR, IND) with a raised amount between 5M USD and 15M USD inclusive,
# excluding rows that have no main sector.

MIN_ROUND_USD = 5000000    # lower bound of the target investment range (inclusive)
MAX_ROUND_USD = 15000000   # upper bound of the target investment range (inclusive)


def _country_investments(frame, country_code):
    """Return the in-range investments of one country as an independent frame.

    Parameters
    ----------
    frame : pandas.DataFrame
        Must provide the 'raised_amount_usd', 'country_code' and
        'main_sector' columns.
    country_code : str
        Value compared against the 'country_code' column.

    Returns
    -------
    pandas.DataFrame
        Copy of the matching rows whose raised_amount_usd lies in
        [MIN_ROUND_USD, MAX_ROUND_USD], with rows lacking a main_sector
        removed. A copy is returned because later cells add columns to it.
    """
    in_range = frame['raised_amount_usd'].between(MIN_ROUND_USD, MAX_ROUND_USD)
    selected = frame.loc[in_range & (frame['country_code'] == country_code)]
    return selected.dropna(subset=['main_sector']).copy()


D1 = _country_investments(venture_sector, 'USA')
D2 = _country_investments(venture_sector, 'GBR')
D3 = _country_investments(venture_sector, 'IND')


In [27]:
## Add a column holding, for every row, the number of investments made in that
## row's main sector (computed separately per country frame).

for country_frame in (D1, D2, D3):
    country_frame['investments_count'] = (
        country_frame.groupby('main_sector')['raised_amount_usd'].transform('count')
    )

In [28]:
## Add a column holding, for every row, the total amount invested in that
## row's main sector (computed separately per country frame).
for country_frame in (D1, D2, D3):
    country_frame['investments_sum'] = (
        country_frame.groupby('main_sector')['raised_amount_usd'].transform('sum')
    )


### 1. Total number of investments in each country

In [31]:
# The row count of each frame is the number of investments in that country
# (printed in the order USA, GBR, IND).
for country_frame in (D1, D2, D3):
    print(country_frame.shape)
## Total Number of investments in USA : 12149
## Total Number of investments in GBR : 628
## Total Number of investments in IND : 330

(12149, 20)
(628, 20)
(330, 20)


### 2.Total amount of investment (USD)

In [35]:
# Total amount invested per country (printed in the order USA, GBR, IND).
for country_frame in (D1, D2, D3):
    print(country_frame['raised_amount_usd'].sum())
# Total amount invested in USA: 108521860586.0
# Total amount invested in GBR: 5436843539.0
# Total amount invested in IND: 2976543602.0

108521860586.0
5436843539.0
2976543602.0


### 3.Top sector (based on count of investments)

In [36]:
# Distinct per-sector investment counts of each country, sorted ascending, so
# index -1 is the largest count, -2 the next distinct count, and so on.
# NOTE(review): sectors with an identical count collapse into a single entry
# here, so a tie would shift the "second"/"third" positions -- confirm no ties.
D1SectorCountUniqueVals = D1['investments_count'].drop_duplicates().sort_values().values
D2SectorCountUniqueVals = D2['investments_count'].drop_duplicates().sort_values().values
D3SectorCountUniqueVals = D3['investments_count'].drop_duplicates().sort_values().values


# Sector whose investment count equals the largest count in each country.
print(D1.loc[D1['investments_count'] == D1SectorCountUniqueVals[-1], 'main_sector'].head(1))
#Top Sector Name USA : Others
print(D2.loc[D2['investments_count'] == D2SectorCountUniqueVals[-1], 'main_sector'].head(1))
#Top Sector Name GBR : Others
print(D3.loc[D3['investments_count'] == D3SectorCountUniqueVals[-1], 'main_sector'].head(1))
#Top Sector Name IND : Others

33    Others
Name: main_sector, dtype: object
836    Others
Name: main_sector, dtype: object
84    Others
Name: main_sector, dtype: object


### 4.Second Best Sector (based on count of investments)

In [37]:
# Sector whose investment count equals the second-largest distinct count.
print(D1.loc[D1['investments_count'] == D1SectorCountUniqueVals[-2], 'main_sector'].head(1))
#Second Best Sector Name USA : Social, Finance, Analytics, Advertising
print(D2.loc[D2['investments_count'] == D2SectorCountUniqueVals[-2], 'main_sector'].head(1))
#Second Best Sector Name GBR : Social, Finance, Analytics, Advertising
print(D3.loc[D3['investments_count'] == D3SectorCountUniqueVals[-2], 'main_sector'].head(1))
#Second Best Sector Name IND : Social, Finance, Analytics, Advertising

6    Social, Finance, Analytics, Advertising
Name: main_sector, dtype: object
161    Social, Finance, Analytics, Advertising
Name: main_sector, dtype: object
423    Social, Finance, Analytics, Advertising
Name: main_sector, dtype: object


### 5.Third best Sector (based on count of investments)

In [38]:
# Sector whose investment count equals the third-largest distinct count.
print(D1.loc[D1['investments_count'] == D1SectorCountUniqueVals[-3], 'main_sector'].head(1))
#Third Best Sector Name USA : Cleantech / Semiconductors
print(D2.loc[D2['investments_count'] == D2SectorCountUniqueVals[-3], 'main_sector'].head(1))
#Third Best Sector Name GBR : Cleantech / Semiconductors
print(D3.loc[D3['investments_count'] == D3SectorCountUniqueVals[-3], 'main_sector'].head(1))
#Third Best Sector Name IND : News, Search and Messaging

60    Cleantech / Semiconductors
Name: main_sector, dtype: object
469    Cleantech / Semiconductors
Name: main_sector, dtype: object
4886    News, Search and Messaging
Name: main_sector, dtype: object


### 6. Number of investments in the top sector

In [39]:
# Largest per-sector investment count (printed in the order USA, GBR, IND).
for sector_counts in (D1SectorCountUniqueVals, D2SectorCountUniqueVals, D3SectorCountUniqueVals):
    print(sector_counts[-1])
#Number of investments in the top sector USA : 2950
#Number of investments in the top sector GBR : 147
#Number of investments in the top sector IND : 110

2950
147
110


### 7. Number of investments in the second best sector

In [40]:
# Second-largest distinct per-sector investment count (order: USA, GBR, IND).
for sector_counts in (D1SectorCountUniqueVals, D2SectorCountUniqueVals, D3SectorCountUniqueVals):
    print(sector_counts[-2])
#Number of investments in the second best sector USA : 2714
#Number of investments in the second best sector GBR : 133
#Number of investments in the second best sector IND : 60

2714
133
60


### 8. Number of investments in the third best sector

In [41]:
# Third-largest distinct per-sector investment count (order: USA, GBR, IND).
for sector_counts in (D1SectorCountUniqueVals, D2SectorCountUniqueVals, D3SectorCountUniqueVals):
    print(sector_counts[-3])
#Number of investments in the third best sector USA : 2350
#Number of investments in the third best sector GBR : 130
#Number of investments in the third best sector IND : 52

2350
130
52


### 9. For the top sector count-wise (point 3), which company received the highest investment?

In [43]:
# For each country frame: keep the rows of its top sector (largest investment
# count), total the raised amount per company name, and print the company with
# the highest total. One loop replaces three copy-pasted stanzas and their
# scratch temp_df* variables; the printed output is unchanged (USA, GBR, IND).
for country_frame, sector_counts in (
    (D1, D1SectorCountUniqueVals),
    (D2, D2SectorCountUniqueVals),
    (D3, D3SectorCountUniqueVals),
):
    top_sector_rows = country_frame.loc[country_frame['investments_count'] == sector_counts[-1]]
    # as_index=False already yields a DataFrame with 'name' as a regular column.
    company_totals = top_sector_rows.groupby('name', as_index=False)['raised_amount_usd'].sum()
    print(company_totals.sort_values(by='raised_amount_usd', ascending=False)['name'].head(1))
#Which company received the highest investment in USA from D1: Virtustream
#Which company received the highest investment in GBR from D2: Electric Cloud
#Which company received the highest investment in IND from D3: FirstCry.com


1877    Virtustream
Name: name, dtype: object
31    Electric Cloud
Name: name, dtype: object
25    FirstCry.com
Name: name, dtype: object


###  10. For the second-best sector count-wise (point 4), which company received the highest investment?

In [44]:
# For each country frame: keep the rows of its second-best sector (second
# largest distinct investment count), total the raised amount per company name,
# and print the company with the highest total. One loop replaces three
# copy-pasted stanzas and their scratch temp_df* variables; the printed output
# is unchanged (USA, GBR, IND).
for country_frame, sector_counts in (
    (D1, D1SectorCountUniqueVals),
    (D2, D2SectorCountUniqueVals),
    (D3, D3SectorCountUniqueVals),
):
    second_sector_rows = country_frame.loc[country_frame['investments_count'] == sector_counts[-2]]
    # as_index=False already yields a DataFrame with 'name' as a regular column.
    company_totals = second_sector_rows.groupby('name', as_index=False)['raised_amount_usd'].sum()
    print(company_totals.sort_values(by='raised_amount_usd', ascending=False)['name'].head(1))
#Company with the highest investment in the second-best sector, USA (D1): SST Inc. (Formerly ShotSpotter)
#Company with the highest investment in the second-best sector, GBR (D2): Celltick Technologies
#Company with the highest investment in the second-best sector, IND (D3): Manthan Systems

1321    SST Inc. (Formerly ShotSpotter)
Name: name, dtype: object
18    Celltick Technologies
Name: name, dtype: object
28    Manthan Systems
Name: name, dtype: object


## Creating CSV File for Master, Top9 and Venture dataframe to be able to use for plotting purpose

In [45]:
# Stack the three country frames, then write the master, top-9 and per-country
# sector frames to CSV without the index column.
venture_sector1_master = pd.concat([D1, D2, D3])
for csv_name, frame in (
    ('master_frame.csv', master_frame),
    ('top9.csv', top9),
    ('venture_sector.csv', venture_sector1_master),
):
    frame.to_csv(csv_name, index=False)