<a href="https://colab.research.google.com/github/GemmaRea/Analisi-Start-Up-Indiane/blob/main/Indian_Startups_Funding_Data.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

<a name="section0"></a>
# **Setup**

In [None]:
import numpy as np
import pandas as pd
pd.set_option('display.float_format', '{:.2f}'.format)
import matplotlib.pyplot as plt
import seaborn as sns
from google.colab import auth
from google.cloud import bigquery
from google.colab import data_table
from google.colab import files

# Authenticate the Colab user first, so that the BigQuery client created below
# can pick up that user's credentials.
auth.authenticate_user()

project = 'sac-2023-388512' # GCP project that hosts the datasets queried in this notebook
location = 'US' # Location passed to the BigQuery client
client = bigquery.Client(project=project, location=location)

# Render DataFrames with Colab's interactive data-table widget.
data_table.enable_dataframe_formatter()

# **Indice**

- [startup_funding2018](#section1)
- [startup_funding2019](#section2)
- [startup_funding2020](#section3)
- [startup_funding2021](#section4)
- [startup_funding2022](#section5)
- [Startup_Funding](#section7)
- [Download](#section6)

<a name="section1"></a>
# **PULIZIA DATI startup_funding2018**
- [To the top](#section0)

In [None]:
# Fetch the raw 2018 funding table from BigQuery.
query_year_2018 = """
  SELECT *
  FROM `sac-2023-388512.Indian_Startups_Funding_Data.fundinf_2018`
"""

# The 2018 table exposes generic column names; map them onto the shared schema.
columns_2018 = {
    'string_field_0': 'company_name',
    'string_field_1': 'industry',
    'string_field_2': 'stage',
    'string_field_3': 'amount',
    'string_field_4': 'location',
    'string_field_5': 'about',
}
# Column order used by the yearly frames in this notebook.
ordered_columns_2018 = ["company_name", "founded", "industry", "location", "about", "stage", "amount"]

year_2018 = client.query(query_year_2018).to_dataframe().rename(columns=columns_2018)
# "founded" is added as an empty placeholder so the frame has the same columns as the other years.
year_2018["founded"] = None
year_2018 = year_2018[ordered_columns_2018]
year_2018

Unnamed: 0,company_name,founded,industry,location,about,stage,amount
0,Tripshelf,,"Internet, Leisure, Marketplace","Kalkaji, Delhi, India",Tripshelf is an online market place for holida...,Seed,"₹16,000,000"
1,Freshboxx,,Food Delivery,"Hubli, Karnataka, India","Freshboxx is incubated at Sandbox Startups, a ...",Seed,—
2,Tolet for Students,,Hospitality,"Jodhpur, Rajasthan, India","Reserve your Room, Hostel or Paying Guest, whi...",Seed,"₹5,000,000"
3,Dainik Jagran,,"Media and Entertainment, News, Outdoors","Kanpur, Uttar Pradesh, India",Dainik Jagran is a media and communications gr...,Seed,"₹40,000,000"
4,Wishup,,"Consumer Applications, Information Services, L...","Azadpur, Delhi, India",Premium Personal Assistance service,Seed,—
...,...,...,...,...,...,...,...
522,Ola,,"Apps, E-Commerce, Internet, Mobile, Ride Shari...","Kormangala, Karnataka, India",Ola is a mobile app that brings together cab d...,Venture - Series Unknown,50000000
523,Shopkirana,,"E-Commerce, Mobile, Retail","Indore, Madhya Pradesh, India",Shopkirana connects brands and traditional ret...,Venture - Series Unknown,"$2,000,000"
524,Cleardekho,,"Eyewear, Internet","Ghaziabad, Uttar Pradesh, India",Uttar Pradesh based online eyewear marketplace.,Venture - Series Unknown,—
525,MadGuy Labs,,E-Learning,"Hyderabad, Andhra Pradesh, India",MadGuy Labs is a Online Test-prep Platform.,Venture - Series Unknown,"$150,000"


In [None]:
# Keep only the rows whose amount carries an explicit currency symbol ($ or ₹);
# placeholders such as "—" and bare numbers are left out. `na=False` treats a
# missing amount as "no symbol" instead of breaking the boolean mask.
has_currency_symbol = (
    year_2018['amount'].str.startswith('$', na=False)
    | year_2018['amount'].str.startswith('₹', na=False)
)
year_2018_clear = year_2018[has_currency_symbol].copy()

# Sanity checks on the number format; inspect these frames manually when needed.
# check_00: amounts ending with a ",00" decimal suffix.
check_00 = year_2018_clear[year_2018_clear["amount"].str.endswith(",00")].copy()
# check_dot: amounts containing a literal dot. `regex=False` is required here,
# otherwise '.' is a regex wildcard and every non-empty amount would match.
check_dot = year_2018_clear[year_2018_clear["amount"].str.contains('.', regex=False)].copy()
year_2018_clear

Unnamed: 0,company_name,founded,industry,location,about,stage,amount
0,Tripshelf,,"Internet, Leisure, Marketplace","Kalkaji, Delhi, India",Tripshelf is an online market place for holida...,Seed,"₹16,000,000"
2,Tolet for Students,,Hospitality,"Jodhpur, Rajasthan, India","Reserve your Room, Hostel or Paying Guest, whi...",Seed,"₹5,000,000"
3,Dainik Jagran,,"Media and Entertainment, News, Outdoors","Kanpur, Uttar Pradesh, India",Dainik Jagran is a media and communications gr...,Seed,"₹40,000,000"
5,FoodBuddy,,"Food Delivery, Online Portals, Restaurants","Belgaum, Karnataka, India","FoodBuddy is a online food delivery portal, pr...",Seed,"₹60,000,000"
8,Log 9 Materials,,Nanotechnology,"Uttar Pradesh, India, Asia",Log 9 Materials is a nano-materials manufactur...,Seed,"₹30,000,000"
...,...,...,...,...,...,...,...
519,Myra,,"Apps, Health Care, Pharmaceutical","Bangalore, Karnataka, India",Myra is a unique solution of technology and op...,Venture - Series Unknown,"₹8,750,000"
520,DRIVEU,,"Rental, Taxi Service, Travel","Bengaluru, Karnataka, India",DriveU is a convenient and a quick way of gett...,Venture - Series Unknown,"₹70,000,000"
521,Lavelle Networks,,"Cloud Computing, Enterprise Software, Network ...","Bengaluru, Karnataka, India",Lavelle Networks provides Software Defined WAN...,Venture - Series Unknown,"₹20,000,000"
523,Shopkirana,,"E-Commerce, Mobile, Retail","Indore, Madhya Pradesh, India",Shopkirana connects brands and traditional ret...,Venture - Series Unknown,"$2,000,000"


In [None]:
# Remove the thousands separators so the amounts can be cast to integers in a later cell.
year_2018_clear["amount"] = year_2018_clear['amount'].str.replace(',', '')

In [None]:
# Renumber the filtered rows from 0; the previous row labels are kept in a new "index" column.
year_2018_clear.reset_index(inplace = True)

In [None]:
# Split the amount into one numeric column per source currency.
# NOTE: despite their names, at this point the two columns still hold the raw
# USD / INR figures; the conversion to EUR happens in the next cell.
is_usd_2018 = year_2018_clear['amount'].str.startswith('$')
is_inr_2018 = year_2018_clear['amount'].str.startswith('₹')

# `regex=False` makes the symbol a literal: '$' is a regex anchor and the
# default interpretation of `str.replace` differs between pandas versions.
year_2018_clear['amount_usd_in_eur'] = (
    year_2018_clear.loc[is_usd_2018, 'amount'].str.replace('$', '', regex=False).astype(int)
)
year_2018_clear['amount_inr_in_eur'] = (
    year_2018_clear.loc[is_inr_2018, 'amount'].str.replace('₹', '', regex=False).astype(int)
)

# Rows of the other currency are NaN after index alignment; set them to 0 so
# the two columns can be summed. Assigning the result back avoids relying on
# in-place mutation through a column selection.
year_2018_clear['amount_usd_in_eur'] = year_2018_clear['amount_usd_in_eur'].fillna(0)
year_2018_clear['amount_inr_in_eur'] = year_2018_clear['amount_inr_in_eur'].fillna(0)
year_2018_clear

  year_2018_clear['amount_usd_in_eur'] = year_2018_clear.loc[year_2018_clear['amount'].str.startswith('$'), 'amount'].str.replace('$', '').astype(int)


Unnamed: 0,index,company_name,founded,industry,location,about,stage,amount,amount_usd_in_eur,amount_inr_in_eur
0,0,Tripshelf,,"Internet, Leisure, Marketplace","Kalkaji, Delhi, India",Tripshelf is an online market place for holida...,Seed,₹16000000,0.00,16000000.00
1,2,Tolet for Students,,Hospitality,"Jodhpur, Rajasthan, India","Reserve your Room, Hostel or Paying Guest, whi...",Seed,₹5000000,0.00,5000000.00
2,3,Dainik Jagran,,"Media and Entertainment, News, Outdoors","Kanpur, Uttar Pradesh, India",Dainik Jagran is a media and communications gr...,Seed,₹40000000,0.00,40000000.00
3,5,FoodBuddy,,"Food Delivery, Online Portals, Restaurants","Belgaum, Karnataka, India","FoodBuddy is a online food delivery portal, pr...",Seed,₹60000000,0.00,60000000.00
4,8,Log 9 Materials,,Nanotechnology,"Uttar Pradesh, India, Asia",Log 9 Materials is a nano-materials manufactur...,Seed,₹30000000,0.00,30000000.00
...,...,...,...,...,...,...,...,...,...,...
198,519,Myra,,"Apps, Health Care, Pharmaceutical","Bangalore, Karnataka, India",Myra is a unique solution of technology and op...,Venture - Series Unknown,₹8750000,0.00,8750000.00
199,520,DRIVEU,,"Rental, Taxi Service, Travel","Bengaluru, Karnataka, India",DriveU is a convenient and a quick way of gett...,Venture - Series Unknown,₹70000000,0.00,70000000.00
200,521,Lavelle Networks,,"Cloud Computing, Enterprise Software, Network ...","Bengaluru, Karnataka, India",Lavelle Networks provides Software Defined WAN...,Venture - Series Unknown,₹20000000,0.00,20000000.00
201,523,Shopkirana,,"E-Commerce, Mobile, Retail","Indore, Madhya Pradesh, India",Shopkirana connects brands and traditional ret...,Venture - Series Unknown,$2000000,2000000.00,0.00


In [None]:
# Convert each currency bucket to EUR with the fixed rates used in this notebook
# (0.93 per USD, 0.011 per INR).
eur_from_usd_2018 = year_2018_clear["amount_usd_in_eur"] * 0.93
eur_from_inr_2018 = year_2018_clear["amount_inr_in_eur"] * 0.011

# Keep only the first comma-separated token of the location.
year_2018_clear["location"] = year_2018_clear["location"].str.split(",").str[0]

# One of the two buckets is always 0, so their sum is the EUR amount; the cast
# to int truncates the fractional part.
year_2018_clear["amount"] = (eur_from_usd_2018 + eur_from_inr_2018).astype(int)

# The helper columns are no longer needed.
year_2018_clear.drop(columns=["amount_usd_in_eur", "amount_inr_in_eur"], inplace=True)
year_2018_clear

Unnamed: 0,index,company_name,founded,industry,location,about,stage,amount
0,0,Tripshelf,,"Internet, Leisure, Marketplace",Kalkaji,Tripshelf is an online market place for holida...,Seed,176000
1,2,Tolet for Students,,Hospitality,Jodhpur,"Reserve your Room, Hostel or Paying Guest, whi...",Seed,55000
2,3,Dainik Jagran,,"Media and Entertainment, News, Outdoors",Kanpur,Dainik Jagran is a media and communications gr...,Seed,440000
3,5,FoodBuddy,,"Food Delivery, Online Portals, Restaurants",Belgaum,"FoodBuddy is a online food delivery portal, pr...",Seed,660000
4,8,Log 9 Materials,,Nanotechnology,Uttar Pradesh,Log 9 Materials is a nano-materials manufactur...,Seed,330000
...,...,...,...,...,...,...,...,...
198,519,Myra,,"Apps, Health Care, Pharmaceutical",Bangalore,Myra is a unique solution of technology and op...,Venture - Series Unknown,96250
199,520,DRIVEU,,"Rental, Taxi Service, Travel",Bengaluru,DriveU is a convenient and a quick way of gett...,Venture - Series Unknown,770000
200,521,Lavelle Networks,,"Cloud Computing, Enterprise Software, Network ...",Bengaluru,Lavelle Networks provides Software Defined WAN...,Venture - Series Unknown,220000
201,523,Shopkirana,,"E-Commerce, Mobile, Retail",Indore,Shopkirana connects brands and traditional ret...,Venture - Series Unknown,1860000


In [None]:
# Keep only the first industry of each comma-separated list.
first_industry_2018 = year_2018_clear["industry"].str.split(",").str.get(0)
year_2018_clear["industry"] = first_industry_2018
# Discard the "index" column that holds the pre-filter row labels.
year_2018_clear.drop(columns="index", inplace=True)

In [None]:
# Duplicate check. The result is not displayed because this is not the last
# expression of the cell; move it to its own cell to inspect it.
year_2018_clear[year_2018_clear.duplicated()]

# Turn the "—" placeholder into a missing value. The dict form states the
# replacement explicitly (a scalar target with value=None has meant "pad from
# the previous row" in some pandas versions), and assigning the result back
# avoids in-place mutation through a column selection.
year_2018_clear["industry"] = year_2018_clear["industry"].replace({"—": None})
year_2018_clear["about"] = year_2018_clear["about"].astype(str)

# Tag every row with the table (year) it comes from.
year_2018_clear["Table"] = 2018
year_2018_clear

Unnamed: 0,company_name,founded,industry,location,about,stage,amount,Table
0,Tripshelf,,Internet,Kalkaji,Tripshelf is an online market place for holida...,Seed,176000,2018
1,Tolet for Students,,Hospitality,Jodhpur,"Reserve your Room, Hostel or Paying Guest, whi...",Seed,55000,2018
2,Dainik Jagran,,Media and Entertainment,Kanpur,Dainik Jagran is a media and communications gr...,Seed,440000,2018
3,FoodBuddy,,Food Delivery,Belgaum,"FoodBuddy is a online food delivery portal, pr...",Seed,660000,2018
4,Log 9 Materials,,Nanotechnology,Uttar Pradesh,Log 9 Materials is a nano-materials manufactur...,Seed,330000,2018
...,...,...,...,...,...,...,...,...
198,Myra,,Apps,Bangalore,Myra is a unique solution of technology and op...,Venture - Series Unknown,96250,2018
199,DRIVEU,,Rental,Bengaluru,DriveU is a convenient and a quick way of gett...,Venture - Series Unknown,770000,2018
200,Lavelle Networks,,Cloud Computing,Bengaluru,Lavelle Networks provides Software Defined WAN...,Venture - Series Unknown,220000,2018
201,Shopkirana,,E-Commerce,Indore,Shopkirana connects brands and traditional ret...,Venture - Series Unknown,1860000,2018


<a name="section2"></a>
# **PULIZIA DATI startup_funding2019**
- [To the top](#section0)


In [None]:
# Fetch the raw 2019 funding table from BigQuery.
query_year_2019 = """
  SELECT *
  FROM `sac-2023-388512.Indian_Startups_Funding_Data.funding_2019`
"""

# Map the 2019 column names onto the shared schema.
columns_2019 = {
    'Company_Brand': 'company_name',
    'Sector': 'industry',
    'Stage': 'stage',
    'Amount___': 'amount',
    'HeadQuarter': 'location',
    'What_it_does': 'about',
    'Founded': 'founded',
}
# Column order used by the yearly frames in this notebook.
ordered_columns_2019 = ["company_name", "founded", "industry", "location", "about", "stage", "amount"]

year_2019 = client.query(query_year_2019).to_dataframe().rename(columns=columns_2019)
year_2019 = year_2019[ordered_columns_2019]
year_2019

Unnamed: 0,company_name,founded,industry,location,about,stage,amount
0,Bombay Shaving,,Ecommerce,,Provides a range of male grooming products,,"$6,300,000"
1,Quantiphi,,AI & Tech,,It is an AI and big data services company prov...,Series A,"$20,000,000"
2,Open Secret,,Food tech,,It produces and sells top quality snacks,,Undisclosed
3,Fireflies .ai,,AI,,Developer of an artificial intelligence-powere...,,"$5,000,000"
4,truMe,,IoT,,A global platform for Identity and Access Mana...,,"$140,000"
...,...,...,...,...,...,...,...
84,Moms Co,,E-commerce,New Delhi,It is into mother and baby care-focused consum...,Series B,"$5,000,000"
85,Ess Kay Fincorp,,Banking,Rajasthan,Organised Non-Banking Finance Company,,"$33,000,000"
86,Nu Genes,2004,AgriTech,Telangana,"It is a seed company engaged in production, pr...",,"$6,000,000"
87,Pumpkart,2014,E-marketplace,Chandigarh,B2B model for appliances and electrical products,,Undisclosed


In [None]:
# Keep only the rows whose amount is expressed in dollars; this leaves out
# values such as "Undisclosed".
is_usd_2019 = year_2019['amount'].str.startswith('$')
year_2019_clear = year_2019[is_usd_2019].copy()
year_2019_clear

Unnamed: 0,company_name,founded,industry,location,about,stage,amount
0,Bombay Shaving,,Ecommerce,,Provides a range of male grooming products,,"$6,300,000"
1,Quantiphi,,AI & Tech,,It is an AI and big data services company prov...,Series A,"$20,000,000"
3,Fireflies .ai,,AI,,Developer of an artificial intelligence-powere...,,"$5,000,000"
4,truMe,,IoT,,A global platform for Identity and Access Mana...,,"$140,000"
5,VMate,,,,A short video platform,,"$100,000,000"
...,...,...,...,...,...,...,...
83,Froogal,,Marketing & Customer loyalty,Hyderabad,A cloud based Customer Loyalty & Engagement Pl...,Pre series A,"$1,000,000"
84,Moms Co,,E-commerce,New Delhi,It is into mother and baby care-focused consum...,Series B,"$5,000,000"
85,Ess Kay Fincorp,,Banking,Rajasthan,Organised Non-Banking Finance Company,,"$33,000,000"
86,Nu Genes,2004,AgriTech,Telangana,"It is a seed company engaged in production, pr...",,"$6,000,000"


In [None]:
# Parse the dollar amounts and convert them to EUR (fixed rate 0.93 per USD).
# `regex=False` makes ',' and '$' literals: '$' is a regex anchor and the
# default interpretation of `str.replace` differs between pandas versions.
# Every row of year_2019_clear already starts with '$', so no extra mask or
# temporary column is needed.
year_2019_clear["amount"] = (
    year_2019_clear["amount"]
    .str.replace(",", "", regex=False)
    .str.replace("$", "", regex=False)
    .astype(int)
    * 0.93
)

  year_2019_clear['amount_usd_in_eur'] = year_2019_clear.loc[year_2019_clear['amount'].str.startswith('$'), 'amount'].str.replace('$', '').astype(int)


In [None]:
# Drop the rows where industry, founded, location and stage are all missing.
# The explicit copy detaches the result from the frame it was derived from, so
# the column assignments in the following cell do not raise SettingWithCopyWarning.
year_2019_clear = year_2019_clear.dropna(
    how="all", subset=["industry", "founded", "location", "stage"]
).copy()
year_2019_clear.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 76 entries, 0 to 88
Data columns (total 7 columns):
 #   Column        Non-Null Count  Dtype  
---  ------        --------------  -----  
 0   company_name  76 non-null     object 
 1   founded       52 non-null     Int64  
 2   industry      72 non-null     object 
 3   location      61 non-null     object 
 4   about         76 non-null     object 
 5   stage         40 non-null     object 
 6   amount        76 non-null     float64
dtypes: Int64(1), float64(1), object(5)
memory usage: 4.8+ KB


In [None]:
# year_2019_clear[year_2019_clear.duplicated()] # duplicate check (disabled)
# Cast the EUR amounts to integers; the fractional part is truncated.
year_2019_clear["amount"] = year_2019_clear["amount"].astype(int)
# Renumber the rows from 0 without keeping the old labels.
year_2019_clear.reset_index(drop= True, inplace= True)
# Tag every row with the table (year) it comes from.
year_2019_clear["Table"] = 2019
year_2019_clear

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  year_2019_clear["amount"] = year_2019_clear["amount"].astype(int)
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  year_2019_clear["Table"] = 2019


Unnamed: 0,company_name,founded,industry,location,about,stage,amount,Table
0,Bombay Shaving,,Ecommerce,,Provides a range of male grooming products,,5859000,2019
1,Quantiphi,,AI & Tech,,It is an AI and big data services company prov...,Series A,18600000,2019
2,Fireflies .ai,,AI,,Developer of an artificial intelligence-powere...,,4650000,2019
3,truMe,,IoT,,A global platform for Identity and Access Mana...,,130200,2019
4,Byju's,2011,Edtech,,Provides online learning classes,,502200000,2019
...,...,...,...,...,...,...,...,...
71,Froogal,,Marketing & Customer loyalty,Hyderabad,A cloud based Customer Loyalty & Engagement Pl...,Pre series A,930000,2019
72,Moms Co,,E-commerce,New Delhi,It is into mother and baby care-focused consum...,Series B,4650000,2019
73,Ess Kay Fincorp,,Banking,Rajasthan,Organised Non-Banking Finance Company,,30690000,2019
74,Nu Genes,2004,AgriTech,Telangana,"It is a seed company engaged in production, pr...",,5580000,2019


<a name="section3"></a>
# **PULIZIA DATI startup_funding2020**
- [To the top](#section0)


In [None]:
# Fetch the raw 2020 funding table from BigQuery.
query_year_2020 = """
  SELECT *
  FROM `sac-2023-388512.Indian_Startups_Funding_Data.funding_2020`
"""

# Columns of the raw table that are not used by the cleaning steps below.
unused_columns_2020 = ["string_field_9", "string_field_5", "string_field_6"]

year_2020 = client.query(query_year_2020).to_dataframe()
year_2020.drop(columns=unused_columns_2020, inplace=True)

In [None]:
# The 2020 table exposes generic column names; map them onto the shared schema.
columns_2020 = {
    'string_field_0': 'company_name',
    'string_field_3': 'industry',
    'string_field_8': 'stage',
    'string_field_7': 'amount',
    'string_field_2': 'location',
    'string_field_4': 'about',
    'string_field_1': 'founded',
}
# Column order used by the yearly frames in this notebook.
ordered_columns_2020 = ["company_name", "founded", "industry", "location", "about", "stage", "amount"]

year_2020 = year_2020.rename(columns=columns_2020)[ordered_columns_2020]
year_2020

Unnamed: 0,company_name,founded,industry,location,about,stage,amount
0,Arth Designbuild,,Construction tech,Hyderebad,Construction technology and solutions provider,,"$1,100,000"
1,Leap India,,Agritech,Coimbatore,Agricultural warehousing and logistics company,Series B,"$30,000,000"
2,Krimanshi,,Agritech,Jodhpur,Sustainable system to feed animals by valorizi...,,"$20,000"
3,Toddle,,,Bengaluru,Collaboration and productivity platform for te...,,Undislosed
4,IncubateHub,,Tech hub,Bengaluru,Provides platform for Corporates to connect es...,,Undisclosed
...,...,...,...,...,...,...,...
1051,Clairvolex,2006,Tech Startup,California,Clairvolex is an IP solutions company that man...,Debt,"$2,000,000"
1052,Udacity,2011,EdTech,California,Udacity develops an online learning platform o...,Debt,"$75,000,000"
1053,Snowflake,2012,Tech company,California,Snowflake is a cloud data platform that provid...,,"$3,000,000,000"
1054,Brinton,2014,HealthTech,California,Brinton is one of the fastest growing Pharmace...,Debt,"$1,300,000"


In [None]:
# Replace missing amounts with the string "0" so the string test below yields a
# clean boolean mask.
amount_text_2020 = year_2020["amount"].fillna("0")
year_2020["amount"] = amount_text_2020

# Keep only the rows whose amount is expressed in dollars.
is_usd_2020 = year_2020["amount"].str.startswith("$")
year_2020_clear = year_2020[is_usd_2020].copy()
year_2020_clear

Unnamed: 0,company_name,founded,industry,location,about,stage,amount
0,Arth Designbuild,,Construction tech,Hyderebad,Construction technology and solutions provider,,"$1,100,000"
1,Leap India,,Agritech,Coimbatore,Agricultural warehousing and logistics company,Series B,"$30,000,000"
2,Krimanshi,,Agritech,Jodhpur,Sustainable system to feed animals by valorizi...,,"$20,000"
6,Zhangmen,2005,Edtech,"Shanghai, China",Zhangmen is an online tutoring platform provid...,,"$400,000,000"
7,Milk Mantra,2009,Food,Odisha,Produces Dairy Products,,"$10,000,000"
...,...,...,...,...,...,...,...
1050,NCOME,2020,Escrow,New Delhi,Escrow-as-a-service platform,,"$400,000"
1051,Clairvolex,2006,Tech Startup,California,Clairvolex is an IP solutions company that man...,Debt,"$2,000,000"
1052,Udacity,2011,EdTech,California,Udacity develops an online learning platform o...,Debt,"$75,000,000"
1053,Snowflake,2012,Tech company,California,Snowflake is a cloud data platform that provid...,,"$3,000,000,000"


In [None]:
# Normalise the dollar amounts to plain digit strings. Every replacement is a
# literal one (`regex=False`): '$' is a regex anchor and the default
# interpretation of `str.replace` differs between pandas versions.
year_2020_clear["amount"] = (
    year_2020_clear["amount"]
    .str.replace(",", "", regex=False)
    .str.replace("$", "", regex=False)
    # Two entries hold two figures instead of one; each is replaced by the
    # midpoint of the two figures.
    .str.replace("800000000 to 850000000", "825000000", regex=False)
    .str.replace("887000 23000000", "11943500", regex=False)
)
year_2020_clear["amount"] = year_2020_clear["amount"].str.strip().astype(int)

  year_2020_clear["amount"] = year_2020_clear["amount"].str.replace(",", "").str.replace("$","").str.replace('800000000 to 850000000', "825000000").str.replace("887000 23000000", "11943500")


In [None]:
# Convert the dollar amounts to EUR (fixed rate 0.93 per USD) and keep only the
# first comma-separated token of the location.
amount_eur_2020 = year_2020_clear["amount"] * 0.93
first_location_2020 = year_2020_clear["location"].str.split(",").str[0]

year_2020_clear["amount"] = amount_eur_2020
year_2020_clear["location"] = first_location_2020
year_2020_clear

Unnamed: 0,company_name,founded,industry,location,about,stage,amount
0,Arth Designbuild,,Construction tech,Hyderebad,Construction technology and solutions provider,,1023000.00
1,Leap India,,Agritech,Coimbatore,Agricultural warehousing and logistics company,Series B,27900000.00
2,Krimanshi,,Agritech,Jodhpur,Sustainable system to feed animals by valorizi...,,18600.00
6,Zhangmen,2005,Edtech,Shanghai,Zhangmen is an online tutoring platform provid...,,372000000.00
7,Milk Mantra,2009,Food,Odisha,Produces Dairy Products,,9300000.00
...,...,...,...,...,...,...,...
1050,NCOME,2020,Escrow,New Delhi,Escrow-as-a-service platform,,372000.00
1051,Clairvolex,2006,Tech Startup,California,Clairvolex is an IP solutions company that man...,Debt,1860000.00
1052,Udacity,2011,EdTech,California,Udacity develops an online learning platform o...,Debt,69750000.00
1053,Snowflake,2012,Tech company,California,Snowflake is a cloud data platform that provid...,,2790000000.00


In [None]:
# Duplicate check; the result is not displayed because this is not the last expression of the cell.
year_2020_clear[year_2020_clear.duplicated()] # duplicate check
# Keep the first occurrence of each fully identical row.
year_2020_clear.drop_duplicates(keep= "first", inplace= True)
# Cast the EUR amounts to integers; the fractional part is truncated.
year_2020_clear["amount"] = year_2020_clear["amount"].astype(int)
# Renumber the rows from 0 without keeping the old labels.
year_2020_clear.reset_index(drop= True, inplace= True)
# Tag every row with the table (year) it comes from.
year_2020_clear["Table"] = 2020
year_2020_clear

Unnamed: 0,company_name,founded,industry,location,about,stage,amount,Table
0,Arth Designbuild,,Construction tech,Hyderebad,Construction technology and solutions provider,,1023000,2020
1,Leap India,,Agritech,Coimbatore,Agricultural warehousing and logistics company,Series B,27900000,2020
2,Krimanshi,,Agritech,Jodhpur,Sustainable system to feed animals by valorizi...,,18600,2020
3,Zhangmen,2005,Edtech,Shanghai,Zhangmen is an online tutoring platform provid...,,372000000,2020
4,Milk Mantra,2009,Food,Odisha,Produces Dairy Products,,9300000,2020
...,...,...,...,...,...,...,...,...
795,NCOME,2020,Escrow,New Delhi,Escrow-as-a-service platform,,372000,2020
796,Clairvolex,2006,Tech Startup,California,Clairvolex is an IP solutions company that man...,Debt,1860000,2020
797,Udacity,2011,EdTech,California,Udacity develops an online learning platform o...,Debt,69750000,2020
798,Snowflake,2012,Tech company,California,Snowflake is a cloud data platform that provid...,,2790000000,2020


<a name="section4"></a>
# **PULIZIA DATI startup_funding2021**
- [To the top](#section0)

In [None]:
# Fetch the raw 2021 funding table from BigQuery.
query_year_2021 = """
SELECT *
 FROM `sac-2023-388512.Indian_Startups_Funding_Data.funding_2021`
"""
year_2021 = client.query(query_year_2021).to_dataframe()
year_2021 = year_2021.rename(columns = {"Amount___":"Amount"})

# Manual corrections, addressed by row label -> {column: corrected value}.
# NOTE(review): the query has no ORDER BY, so these labels presumably depend on
# the order in which BigQuery returns the rows — confirm they still point at
# the intended records.
# NOTE(review): the amounts below are written without a leading '$', while the
# cleaning cell further down keeps only rows whose Amount starts with '$' —
# confirm whether these corrected rows are meant to survive that filter.
effervescent_about = "Primary Business is Development and Manufacturing of Novel Healthcare Products in Effervescent forms using imported propriety ingredients."
manual_fixes_2021 = {
    6: {
        "HeadQuarter": "Varun Khanna",
        "What_it_does": effervescent_about,
        "Sector": "Pharmaceuticals",
        "Amount": "22000000",
    },
    7: {
        "HeadQuarter": "Varun Khanna",
        "What_it_does": effervescent_about,
        "Sector": "Pharmaceuticals",
        # The leading space is kept on purpose: removing it could make rows 6
        # and 7 identical, which would change what drop_duplicates removes and
        # shift the row labels patched in the next cell — TODO confirm intent.
        "Amount": " 22000000",
    },
    78: {
        "HeadQuarter": "Vikash Mishra, Mragank Jain",
        "What_it_does": "MoEVing is India's only Electric Mobility focused Technology Platform with a vision to accelerate EV adoption in India.",
        "Sector": "Gurugram",
        "Amount": "5000000",
        # Was "\tSeed": the stray leading tab made this a distinct stage value.
        "Stage": "Seed",
    },
    # Was "Pre_series A"; the dataset spells this stage "Pre-series A".
    142: {"Amount": "1000000", "Stage": "Pre-series A"},
    356: {"Amount": "300000"},
    60: {"Amount": "1200000"},
    61: {"Amount": "1200000"},
    1188: {"Amount": "300000"},
    360: {"Amount": "6000000"},
    589: {"Amount": "1000000"},
}
for row_label, fixes in manual_fixes_2021.items():
    for column_name, fixed_value in fixes.items():
        year_2021.at[row_label, column_name] = fixed_value

# Keep only the columns shared with the other years, in the common order.
year_2021 = year_2021[["Company_Brand", "Founded", "Sector", "HeadQuarter", "What_it_does", "Stage", "Amount"]]
year_2021

Unnamed: 0,Company_Brand,Founded,Sector,HeadQuarter,What_it_does,Stage,Amount
0,Lendingkart,1999,FinTech,Gujarat,Lendingkart is an online financing company ded...,Debt,"$15,000,000"
1,Blive,2004,Tourism,Panaji,B: Live is an electric vehicle tourism startup.,Pre-series A,"$1,000,000"
2,Better Capital,2006,Venture Capital & Private Equity,Santra,Better is a top-tier India-focused pre-seed ve...,,$15000000
3,Lenskart,2008,Eyewear,Faridabad,India's fastest growing eyewear company and la...,,$220000000
4,Kredent,2008,EdTech,Kolkata,Kredent Academy is the unique concept where fi...,,$1000000
...,...,...,...,...,...,...,...
1204,GlobalBees,2021,E-commerce,New Delhi,Globalbees partners with entrepreneurs who hav...,Series B,$111000000
1205,GlobalBees,2021,D2C Business,New Delhi,Globalbees partners with entrepreneurs who hav...,Series A,$150000000
1206,Intervue,2021,SaaS startup,New Delhi,World's fastest collaborative environment to t...,Seed,$Undisclosed
1207,Xpand,2021,Retail,New Delhi,LMCE handholds brands and enables their reach ...,Pre-series A,$1500000


In [None]:
# Duplicate check; the result is not displayed because this is not the last expression of the cell.
year_2021[year_2021.duplicated()] # duplicate check
# Keep the first occurrence of each fully identical row, then renumber the rows from 0.
year_2021.drop_duplicates(keep= "first", inplace= True)
year_2021.reset_index(drop= True, inplace= True)
# Manual corrections addressed by row label after the renumbering above.
# NOTE(review): these labels depend on the row order of the query result and on
# how many duplicates were dropped — confirm they still target the intended rows.
year_2021.at[273,"Stage"] = "Seed"
# These amounts do not start with '$', so the '$' filter in the next cell excludes the rows.
year_2021.at[120,"Amount"] = "Undisclosed"
year_2021.at[811,"Amount"] = "Undisclosed"
year_2021.at[75,"Amount"] = "Undisclosed"
year_2021.at[892,"Amount"] = "Undisclosed"
year_2021.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1190 entries, 0 to 1189
Data columns (total 7 columns):
 #   Column         Non-Null Count  Dtype 
---  ------         --------------  ----- 
 0   Company_Brand  1190 non-null   object
 1   Founded        1189 non-null   Int64 
 2   Sector         1190 non-null   object
 3   HeadQuarter    1189 non-null   object
 4   What_it_does   1190 non-null   object
 5   Stage          771 non-null    object
 6   Amount         1190 non-null   object
dtypes: Int64(1), object(6)
memory usage: 66.4+ KB


In [None]:
# Keep only the rows whose amount starts with '$'.
# NOTE(review): this also drops the rows whose Amount was patched by hand
# without a '$' prefix in the loading cell — confirm that this is intended.
year_2021_clear = year_2021[year_2021['Amount'].str.startswith('$')].copy()

# Normalise the amount text to a plain number. Every replacement is a literal
# one (`regex=False`): '$' is a regex anchor and the default interpretation of
# `str.replace` differs between pandas versions. Removing every '$' in a single
# pass also covers doubled symbols such as "$$".
# NOTE(review): "$Undisclosed"/"$undisclosed" become 0 and stay in the frame,
# whereas the 2019 and 2020 filters exclude "Undisclosed" — confirm intent.
year_2021_clear["Amount"] = (
    year_2021_clear["Amount"]
    .str.strip()
    .str.replace("$", "", regex=False)
    .str.replace(",", "", regex=False)
    .str.replace("undisclosed", "0", regex=False)
    .str.replace("Undisclosed", "0", regex=False)
)

# Convert to EUR (fixed rate 0.93 per USD); the cast to int truncates the
# fractional part.
year_2021_clear["Amount"] = year_2021_clear["Amount"].astype(float) * 0.93
year_2021_clear["Amount"] = year_2021_clear["Amount"].astype(int)

# Map the 2021 column names onto the shared schema.
year_2021_clear = year_2021_clear.rename(columns = {
                                'Company_Brand': 'company_name',
                                "Founded": "founded",
                                'Sector': 'industry',
                                'Stage': 'stage',
                                'Amount': 'amount',
                                'HeadQuarter': 'location',
                                'What_it_does': 'about'
                            })
# Tag every row with the table (year) it comes from.
year_2021_clear["Table"] = 2021
year_2021_clear

  year_2021_clear["Amount"] = year_2021_clear['Amount'].str.strip().str.replace("$","").str.replace("$$","")
  year_2021_clear["Amount"] = year_2021_clear['Amount'].str.strip().str.replace("$","").str.replace("$$","")


Unnamed: 0,company_name,founded,industry,location,about,stage,amount,Table
0,Lendingkart,1999,FinTech,Gujarat,Lendingkart is an online financing company ded...,Debt,13950000,2021
1,Blive,2004,Tourism,Panaji,B: Live is an electric vehicle tourism startup.,Pre-series A,930000,2021
2,Better Capital,2006,Venture Capital & Private Equity,Santra,Better is a top-tier India-focused pre-seed ve...,,13950000,2021
3,Lenskart,2008,Eyewear,Faridabad,India's fastest growing eyewear company and la...,,204600000,2021
4,Kredent,2008,EdTech,Kolkata,Kredent Academy is the unique concept where fi...,,930000,2021
...,...,...,...,...,...,...,...,...
1185,GlobalBees,2021,E-commerce,New Delhi,Globalbees partners with entrepreneurs who hav...,Series B,103230000,2021
1186,GlobalBees,2021,D2C Business,New Delhi,Globalbees partners with entrepreneurs who hav...,Series A,139500000,2021
1187,Intervue,2021,SaaS startup,New Delhi,World's fastest collaborative environment to t...,Seed,0,2021
1188,Xpand,2021,Retail,New Delhi,LMCE handholds brands and enables their reach ...,Pre-series A,1395000,2021


<a name="section5"></a>
# **PULIZIA DATI startup_funding2022**
- [To the top](#section0)


In [None]:
# Fetch the May 2022 funding table from BigQuery.
query_May = """
  SELECT  *
FROM `sac-2023-388512.Indian_Startups_Funding_Data_2022.May_2022`
"""
# Drop the rows where company name, founding year and location are all missing,
# then any row still lacking a company name, and renumber from 0.
May = (
    client.query(query_May)
    .to_dataframe()
    .dropna(how="all", subset=["Company_Name", "Founded", "Location"])
    .dropna(subset=["Company_Name"])
    .reset_index(drop=True)
)

# Manual corrections for the first row, applied in the listed order.
first_row_fixes = {
    "Amount": 3500000.0,
    "What_it_does": "FirstCure Health aims to simplify the surgery experience by bringing the best surgeons with modern and safe procedures at affordable costs",
    "Sector": "Healthcare,Wellness",
    "Location": "Noida",
    "Stage": "Pre-seed",
    "Founded": None,
}
for column_name, fixed_value in first_row_fixes.items():
    May.at[0, column_name] = fixed_value

# Discard the rows without an amount and renumber again.
May.dropna(how="all", subset=["Amount"], inplace=True)
May.reset_index(drop=True, inplace=True)
May

Unnamed: 0,Company_Name,Founded,Location,Sector,What_it_does,Founders,Investor,Amount,Stage
0,FirstCure Health,,Noida,"Healthcare,Wellness",FirstCure Health aims to simplify the surgery ...,Pre-seed,,3500000,Pre-seed
1,KiarX,2020.0,Ahemdabad,Mining,KiarX is a mine management tech start-up focus...,,Shuru Up Ventures,15000000,Seed
2,Revoh,2017.0,Chennai,Automobile Manufacturing,Electric vehicle powertrain manufacturing,Vignesh Durai,Vel Kanniappan and Ravi Renganathan,15000000,Seed
3,FlexifyMe,2021.0,Pune,"Healthcare,Wellness","FlexifyMe is to balance your Mind, Body & Soul...",Manjeet Singh,Sachin Anand and Dipen Shah,30000000,Seed
4,Red Basil Technologies,2021.0,Gurgaon,Food&Beverages,Red Basil Technologies is a tech-driven and ze...,,PlanB Capital and Sat Industries,2500000,Seed
5,ForeignAdmits,2018.0,Bengaluru,Career Planning,ForeignAdmits is a mobile career coaching plat...,"Ashwini Jain, Nikhil Jain, Sarthak Agarwal",Beerud Sheth and SEA Fund,67600000,Seed
6,Sploot,2019.0,Gurgaon,Consumer Applications,Sploot is a community-led platform for better ...,,Redstart Labs,50000000,Seed
7,Fanztar,2022.0,Gurgaon,Software,Fanztar is a a Web3 platform for the creator e...,,India Quotient and Farid Ahsan,5000000,Seed
8,NutriTap,2017.0,Gurgaon,Food&Beverages,NutriTap is provides healthy food options in I...,Rajesh Kumar,IK Capital and Venture Catalysts,12000000,Seed
9,Goldenpi,2017.0,Banglore,Financial Services,One stop shop for Bonds and Debentures exclusi...,"Abhijit Roy, Samir Baran Pratihar",Rainmatter Capital and Rainmatter Technology,200000,Seed


In [None]:
# Fetch the January 2022 funding table from BigQuery into a DataFrame.
query_Jen = """
  SELECT *
FROM `sac-2023-388512.Indian_Startups_Funding_Data_2022.January_2022`
"""
Jen = client.query(query_Jen).to_dataframe()
Jen

Unnamed: 0,Company_Name,Founded,Location,Sector,What_it_does,Founders,Investor,Amount,Stage
0,Pine Labs,1998,Noida,Information Technology & Services,Pine Labs offers a merchant platform that incl...,Amrish Rau,State Bank of India,"$20,000,000",
1,OneDios,2019,Noida,Information Technology & Services,OneDios founded in 2019 is a startup initiati...,Nitin Chawala,"India Angel Network, LetsVenture","$1,200,000",
2,Addverb Technologies,2016,Noida,Industrial Automation,Addverb is a global robotics company based out...,"Sangeet Kumar, Prateek Jain, Bir Singh, Satish...",Reliance,"$132,000,000",
3,Moneyboxx,2018,Mumbai,Financial Services,A NBFC democratising access to capital to the ...,MAYUR MODI,,"$1,000,000",
4,CASHe,2016,Mumbai,Financial Services,CASHe is a credit-enabled financial technology...,Raman,TSLC,"$10,000,000",
...,...,...,...,...,...,...,...,...,...
110,MyCaptain,2013,Bangalore,EdTech,MyCaptain is an ed-tech startup that enables e...,"Mohammed Zeeshan, Sameer Ramesh, Ruhan Naqash",Ankur Capital,"$3,000,000",Pre-series A
111,Finsall,2019,Bangalore,Financial Services,Finsall is an end-to-end technology process fo...,"Prabal Khanna, Tim Mathews",Unicorn India Ventures,"$1,000,000",Pre-series A
112,Cloud Tailor,2020,Hyderabad,Apparel & Fashion,World's Local Cloud Boutique mobile app - Excl...,"Susmitha, Rudra Lakkakula","35North Ventures, Mergerdomo","$1,000,000",Pre-series A
113,Hospals,2018,New Delhi,Hospital & Health Care,Hospals is ‘The most trust able’ medical trave...,"Danish Ahmed, Obaidullah, Suneel Kapur","Inflection Point Ventures, 9Unicorns, Singapor...","$3,500,000",Pre-series A


In [None]:
# Load the complete February_2022 table from BigQuery into a DataFrame.
query_Feb = """
 SELECT *
FROM `sac-2023-388512.Indian_Startups_Funding_Data_2022.February_2022`
"""
Feb = (
    client
    .query(query_Feb)
    .to_dataframe()
)
# Bare last expression so the notebook renders the frame.
Feb

Unnamed: 0,Company_Name,Founded,Location,Sector,What_it_does,Founders,Investor,Amount,Stage
0,Hero FinCorp,1991,New Delhi,Financial Services,"Delhi-based ?Hero FinCorp?, a non-banking fina...",Abhimanyu Munjal,"Apollo, Hero MotoCorp","$267,000,000",
1,Pine Labs,1998,Noida,Information Technology & Services,A merchant platform company that provides fina...,"Lokvir Kapoor, Rajul Garg, Tarun Upadhyay",Alpha Wave Venture,"$150,000,000",
2,V-Ensure,2010,Mumbai,Pharma,Development of Pharmaceutical dossiers for the...,Sathyanarayana vemula,Investcorp,"$10,000,000",
3,Chargebee,2011,Chennai,Financial Services,Chargebee is a recurring billing and subscript...,"Krish Subramanian, Thiyagarajan T, Rajaraman S...","Tiger Global, Sequoia Capital","$250,000,000",
4,Stellapps,2011,Bangalore,Computer Software,Stellapps is an end-to-end dairy technology so...,Ranjith Mukundan,IDH FarmFit,Undisclosed,
...,...,...,...,...,...,...,...,...,...
91,Chargeup,2019,New Delhi,Renewables & Environment,"Charge-up offers Battery as a Service, solvin...","Varun Goenka, Ankur Madan","Capital A, Anicut Capital","$2,500,000",Pre-series A
92,GoalTeller,2020,Bangalore,Information Technology & Services,GoalTeller is a bootstrapped fintech startup w...,"Vivek Banka, Abhisek Puglia","Dr Ranjan Pai, Pankaj Fitkariwala, Himanshu Bh...","$500,000",Pre-series A
93,Prolance,2020,Bangalore,Furniture,"Prolance, a manufacturing platform for interi...","Rama Harinath K, Vivek Parasuram, Raghunath Gu...","Srini Anumolu, Karthik Bhat","$500,000",Pre-series A
94,ClaimBuddy,2020,Gurgaon,Hospital & Health Care,ClaimBuddy.in is a MediClaim support company t...,"Ajit Patel, Khet Singh","Chiratae Ventures, Rebright Partners","$3,000,000",Pre-series A


In [None]:
# Load the complete March_2022 table from BigQuery into a DataFrame.
query_March = """
  SELECT*
FROM `sac-2023-388512.Indian_Startups_Funding_Data_2022.March_2022`
"""
March = (
    client
    .query(query_March)
    .to_dataframe()
)
# Bare last expression so the notebook renders the frame.
March

Unnamed: 0,Company_Name,Founded,Location,Sector,What_it_does,Founders,Investor,Amount,Stage
0,Ferns N Petals,1994,New Delhi,Retail,Largest Gifting Chain,"Meeta Gutgutia, Vikaas Gutgutia",Lighthouse,"$27,000,000",
1,Pine Labs,1998,Noida,IT Services and IT Consulting,A merchant platform company that provides fina...,Amrish Rau,Vitruvian Partners,"$50,000,000",
2,SIDBI Venture Capital,1999,Mumbai,Venture Capital and Private Equity Principals,An investment management company and a wholly ...,Debashis Ghosh,Ubharte Sitaare Fund,"$60,000,000",
3,Games24x7,2006,Mumbai,Internet Publishing,Games24x7 is India's leading digital skill gam...,"Trivikraman Thampy, Bhavin Pandya",Malabar Investment,"$75,000,000",
4,Perfios,2008,Bangalore,FinTech,Perfios is a leading product technology compan...,V.R. Govindarajan,"Bessemer Venture Partners, Warburg Pincus","$68,000,000",
...,...,...,...,...,...,...,...,...,...
93,SuperK,2019,"Small Towns, Andhra",Retail,SuperK is a full-stack solution to empower sma...,"Neeraj Menta, Anil Thontepu",021 Capital,"$5,500,000",Pre-series A
94,Junio,2020,New Delhi,Financial Services,The startup’s goal is to nurture discipline an...,"Ankit Gera, Shankar Nath",NB Ventures,"$6,000,000",Pre-series A
95,CARD91,2020,Bangalore,Financial Services,Card91 offers plug & play payment infrastructu...,"Vineet Saxena, Ajay Pandey, Kush Srivastava","Infinity Ventures, Point72 Ventures, Sabre Par...","$13,000,000",Pre-series A
96,Seekho.ai,2021,Gurgaon,E-Learning Providers,Seekho is India's first micro-learning based p...,"Divya Jain, Ajeet Singh Kushwaha, Arihant Jain","LetsVenture, Trica, Super Morpheus","$3,000,000",Pre-series A


In [None]:
# Load the complete April_2022 table from BigQuery into a DataFrame.
query_April = """
SELECT*
FROM `sac-2023-388512.Indian_Startups_Funding_Data_2022.April_2022`
"""
April = client.query(query_April).to_dataframe()

# Two rows arrive with their values shifted into the wrong columns (the amount
# sits in "Founders" and the stage in "Investor"), so they are repaired by hand.
# The rows are looked up by company name instead of by positional index:
# the query has no ORDER BY, so the row order returned by BigQuery is not
# guaranteed and a fixed index could silently patch the wrong company.
# NOTE(review): the person names are presumably the founders (they were
# previously written to "Location"); the real location is not available in the
# row, so it is left empty. Confirm against the source data.
# NOTE(review): a later cell keeps only amounts that start with "$"; these
# patched plain-number amounts do not, so confirm the rows end up where intended.
april_row_fixes = {
    "EPNS": {
        "Amount": "66000000.0",
        "Stage": "Seed",
        "What_it_does": "BUIDLing World's First Decentralized Notification Protocol on Ethereum",
        "Founders": "Harsh Rajat, Richa Joshi",
        "Investor": None,
        "Location": None,
        "Sector": None,
    },
    "Eximpe": {
        "Amount": "270000000.0",
        "Stage": "Seed",
        # Leading tab from the original literal removed (it leaked into the data).
        "What_it_does": "Eximpe is Managing sellers, buyers, processes, payments, and financial services.",
        "Founders": "Arjun Zacharia",
        "Investor": None,
        "Location": None,
        "Sector": None,
    },
}

for company, fixes in april_row_fixes.items():
    row_mask = April["Company_Name"].str.strip() == company
    matches = int(row_mask.sum())
    if matches != 1:
        # Fail loudly instead of patching nothing (or several rows) unnoticed.
        raise ValueError(
            f"Expected exactly one April row for {company!r}, found {matches}"
        )
    for column, value in fixes.items():
        April.loc[row_mask, column] = value

# Drop the rows that still have no amount after the manual repairs.
April = April.dropna(subset=["Amount"])
April

Unnamed: 0,Company_Name,Founded,Location,Sector,What_it_does,Founders,Investor,Amount,Stage
0,Zeta,2015,San Francisco,Financial services,Zeta is a modern banking tech company providin...,"Bhavin Turakhia, Ramki Gaddipati",Multiples,"$30,000,000",
1,EPNS,2020,"Harsh Rajat, Richa Joshi",,BUIDLing World's First Decentralized Notificat...,"$66,000,000",Seed,66000000.0,Seed
2,Eximpe,2021,Arjun Zacharia,,"\tEximpe is Managing sellers, buyers, processe...","$270,000,000",Seed,270000000.0,Seed
3,Glip,2020,Delaware,Software,Glip is a creator tool suite for gamers to cre...,"Brett Paden, Claudio Pinkus, David Hersh, Jeff...",Better Capita,"$3,000,000",Seed
4,Limechat,2020,Faridabad,Software,Limechat provides a personalised shopping expe...,"Aniket Bajpai, Nikhil Gupta",Pi Ventures and Stellaris Venture Partners,"$5,000,000",Seed
...,...,...,...,...,...,...,...,...,...
90,Frigate,2021,Tiruchirappall,Manufacturing,"Frigate provides fabrication, 3D printing, and...","Adithya Narayanan Seetharaman, Chandrasekar Ch...",Abhishek Pandey and Srinath Ramakkrushnan,"$17,500,000",undisclosed
91,Wildermart,2021,Bengaluru,Food and bevrages,Wildermart is a healthy and sustainable grocer...,,Abhinav Mathur and 17 other investors,"$24,000,000",undisclosed
92,Lauriko,2021,Hyderabad,"Health,wellness",Lauriko is a Manufacture of food products and ...,Lavanya Sunkari,Lakshmikant PB and Murthy Aradhi,"$37,000,000",undisclosed
93,iTribe,2021,Bengaluru,Financial services,iTribe is a one-stop solution for customers to...,"Nikhil,Pruthvi",Eximius Ventures and PlanBcapital,"$1,000,000",undisclosed


In [None]:
# Factor applied to every 2022 amount before truncating to an integer.
# NOTE(review): presumably a USD -> EUR conversion rate; confirm currency and rate.
AMOUNT_CONVERSION_RATE = 0.93

# Source column -> output column, in the order the cleaned table should have.
columns_2022 = {
    "Company_Name": "company_name",
    "Founded": "founded",
    "Sector": "industry",
    "Location": "location",
    "What_it_does": "about",
    "Stage": "stage",
    "Amount": "amount",
}

# Stack the monthly tables that store the amount as text.
year_2022 = pd.concat([Jen, Feb, March, April])
year_2022["Amount"] = year_2022["Amount"].fillna("0")

# Keep only rows whose amount is a "$"-prefixed string.
# NOTE(review): this also removes missing amounts (filled with "0" above),
# "Undisclosed" amounts and the hand-patched April values such as "66000000.0";
# confirm that dropping them is intended.
has_dollar_amount = year_2022["Amount"].str.startswith("$", na=False)
year_2022_clear = year_2022[has_dollar_amount].copy()

# Strip currency formatting. regex=False makes every pattern a literal string:
# "$" is a regex metacharacter, and relying on the implicit default of `regex`
# is deprecated and behaves differently across pandas versions.
amount_text = year_2022_clear["Amount"].str.strip()
for token, replacement in (
    ("$", ""),
    (",", ""),
    ("Undisclosed", "0"),
    ("Vaibhav Anant", "0"),
    ("Null", "0"),
):
    amount_text = amount_text.str.replace(token, replacement, regex=False)
year_2022_clear["Amount"] = amount_text

# May is appended only after the text clean-up, so its amounts skip the "$" filter.
year_2022_clear = pd.concat([year_2022_clear, May])

# Apply the conversion factor, then truncate to whole units.
year_2022_clear["Amount"] = year_2022_clear["Amount"].astype(float) * AMOUNT_CONVERSION_RATE
year_2022_clear["Amount"] = year_2022_clear["Amount"].astype(int)

# Keep the shared columns and give them the names used by the other yearly tables.
year_2022_clear = year_2022_clear[list(columns_2022)].rename(columns=columns_2022)
year_2022_clear["Table"] = 2022
year_2022_clear

  year_2022_clear["Amount"] = year_2022_clear['Amount'].str.strip().str.replace("$","").str.replace(",","").str.replace("Undisclosed", '0').str.replace('Vaibhav Anant', "0").str.replace('Null', "0")


Unnamed: 0,company_name,founded,industry,location,about,stage,amount,Table
0,Pine Labs,1998,Information Technology & Services,Noida,Pine Labs offers a merchant platform that incl...,,18600000,2022
1,OneDios,2019,Information Technology & Services,Noida,OneDios founded in 2019 is a startup initiati...,,1116000,2022
2,Addverb Technologies,2016,Industrial Automation,Noida,Addverb is a global robotics company based out...,,122760000,2022
3,Moneyboxx,2018,Financial Services,Mumbai,A NBFC democratising access to capital to the ...,,930000,2022
4,CASHe,2016,Financial Services,Mumbai,CASHe is a credit-enabled financial technology...,,9300000,2022
...,...,...,...,...,...,...,...,...
16,Super Bottoms,2014,,Thane,India's First Reusable Baby Diaper brand,Series A,5115000,2022
17,Josh Talks,2015,Broadcasting,Haryana,Josh Talks is a startup that produces videos a...,Series A,465000,2022
18,AssetPlus,2016,Financial Services,Chennai,AssetPlus focuses on offering digital-first so...,Series A,26040000,2022
19,Hono,2008,Software,Haryana,Hono is a provider of HR solutions and services.,Series A,36270000,2022


In [None]:
# Duplicate check: show every row of year_2022 that repeats an earlier row.
year_2022.loc[year_2022.duplicated()]

Unnamed: 0,Company_Name,Founded,Location,Sector,What_it_does,Founders,Investor,Amount,Stage


<a name="section7"></a>
# **Startup_Funding**
- [To the top](#section0)


In [None]:
# Combine the cleaned yearly tables (2018-2022) into one frame with a fresh
# 0..n-1 index.
Startup_funding = pd.concat(
    [
        year_2018_clear,
        year_2019_clear,
        year_2020_clear,
        year_2021_clear,
        year_2022_clear,
    ],
    ignore_index=True,
)
Startup_funding

Unnamed: 0,company_name,founded,industry,location,about,stage,amount,Table
0,Tripshelf,,Internet,Kalkaji,Tripshelf is an online market place for holida...,Seed,176000,2018
1,Tolet for Students,,Hospitality,Jodhpur,"Reserve your Room, Hostel or Paying Guest, whi...",Seed,55000,2018
2,Dainik Jagran,,Media and Entertainment,Kanpur,Dainik Jagran is a media and communications gr...,Seed,440000,2018
3,FoodBuddy,,Food Delivery,Belgaum,"FoodBuddy is a online food delivery portal, pr...",Seed,660000,2018
4,Log 9 Materials,,Nanotechnology,Uttar Pradesh,Log 9 Materials is a nano-materials manufactur...,Seed,330000,2018
...,...,...,...,...,...,...,...,...
2581,Super Bottoms,2014,,Thane,India's First Reusable Baby Diaper brand,Series A,5115000,2022
2582,Josh Talks,2015,Broadcasting,Haryana,Josh Talks is a startup that produces videos a...,Series A,465000,2022
2583,AssetPlus,2016,Financial Services,Chennai,AssetPlus focuses on offering digital-first so...,Series A,26040000,2022
2584,Hono,2008,Software,Haryana,Hono is a provider of HR solutions and services.,Series A,36270000,2022


<a name="section6"></a>
# **DOWNLOAD**
- [To the top](#section0)


In [None]:
# year_2018_clear.to_csv("Clean_Data_2018.csv", index = False)
# files.download("Clean_Data_2018.csv")

In [None]:
# year_2019_clear.to_csv("Clean_Data_2019.csv", index = False)
# files.download("Clean_Data_2019.csv")

In [None]:
# year_2020_clear.to_csv("Clean_Data_2020.csv", index = False)
# files.download("Clean_Data_2020.csv")

In [None]:
# year_2021_clear.to_csv("Clean_Data_2021.csv", index = False)
# files.download("Clean_Data_2021.csv")

In [None]:
# year_2022_clear.to_csv("Clean_Data_2022.csv", index = False)
# files.download("Clean_Data_2022.csv")

In [None]:
# Startup_funding.to_csv("Startup_funding.csv", index = False)
# files.download("Startup_funding.csv")

# PROVA

In [None]:
# Trial dataset: all years combined, keeping only rows with no missing values.
# The 2018 copy gets founded = 0 so that column holds a value before dropna() runs.
b = year_2018_clear.copy()
b["founded"] = 0

a = (
    pd.concat(
        [b, year_2019_clear, year_2020_clear, year_2021_clear, year_2022_clear],
        ignore_index=True,
    )
    .dropna()
    .reset_index(drop=True)
)
a

Unnamed: 0,company_name,founded,industry,location,about,stage,amount,Table
0,Tripshelf,0,Internet,Kalkaji,Tripshelf is an online market place for holida...,Seed,176000,2018
1,Tolet for Students,0,Hospitality,Jodhpur,"Reserve your Room, Hostel or Paying Guest, whi...",Seed,55000,2018
2,Dainik Jagran,0,Media and Entertainment,Kanpur,Dainik Jagran is a media and communications gr...,Seed,440000,2018
3,FoodBuddy,0,Food Delivery,Belgaum,"FoodBuddy is a online food delivery portal, pr...",Seed,660000,2018
4,Log 9 Materials,0,Nanotechnology,Uttar Pradesh,Log 9 Materials is a nano-materials manufactur...,Seed,330000,2018
...,...,...,...,...,...,...,...,...
1580,Humpy Farms,2016,Agriculture,Mumbai,Humpy Farms provides a structured training of ...,Angel,4650000,2022
1581,Josh Talks,2015,Broadcasting,Haryana,Josh Talks is a startup that produces videos a...,Series A,465000,2022
1582,AssetPlus,2016,Financial Services,Chennai,AssetPlus focuses on offering digital-first so...,Series A,26040000,2022
1583,Hono,2008,Software,Haryana,Hono is a provider of HR solutions and services.,Series A,36270000,2022


In [None]:
# Write the combined, NaN-free frame `a` to a CSV file without the index column,
# then hand that file to google.colab's `files.download`.
a.to_csv("Startup_funding_clear.csv", index = False)
files.download("Startup_funding_clear.csv")

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>