## Importing xlsx

In [1]:
#%pip install openpyxl
#%pip install xlrd

In [2]:
import pandas as pd
import numpy as np
from apifunctions import *
import datetime

# Display every row and every column of a DataFrame (None disables truncation).
pd.set_option("display.max_rows", None)
pd.set_option("display.max_columns", None)

In [3]:
# Load the Bloomberg exports: five Excel workbooks and one CSV (market_cap).
wacc, prices, sales_growth, parameters, shares_outstanding = (
    pd.read_excel(workbook)
    for workbook in (
        "../data/datos_Bloomberg/wacc.xlsx",
        "../data/datos_Bloomberg/prices.xlsx",
        "../data/datos_Bloomberg/sales_growth.xlsx",
        "../data/datos_Bloomberg/parameters.xlsx",
        "../data/datos_Bloomberg/shares_outstanding.xlsx",
    )
)
market_cap = pd.read_csv("../data/datos_Bloomberg/market_cap.csv")

In [4]:
# market_cap and shares_outstanding are already loaded by the read calls in the
# previous cell; reading the same two files a second time here was redundant,
# so the duplicate reads have been removed.

In [5]:
# Keep the original "ID" column of wacc, captured before any rows are removed.
company_list = wacc["ID"]

## IDs as index

In [6]:
# Use the "ID" column as the row index of each dataframe. The frames are
# modified in place, so the existing variable names keep pointing at them.
datasets = [wacc, prices, sales_growth, market_cap, shares_outstanding]

for frame in datasets:
    frame.set_index("ID", inplace=True)

## Dealing with NaNs

In [7]:
# First drop the rows that are NaN in every column, for each of the five
# dataframes: wacc, prices, sales_growth, market_cap and shares_outstanding.
datasets = [wacc, prices, sales_growth, market_cap, shares_outstanding]

for frame in datasets:
    frame.dropna(axis="index", how="all", inplace=True)

#### For simplicity, in prices we are going to delete every row that contains a NaN: a NaN means the company was not trading at that point, so it would not allow us to do the backtesting:

In [8]:
# Remove, in place, every row of prices that has at least one NaN.
prices.dropna(axis="index", how="any", inplace=True)

#### Now we are going to delete the companies for which we don't have information in at least one of the datasets

In [9]:
# remove_columns is not defined in this notebook (presumably it comes from the
# `apifunctions` star import), so its exact behaviour is not visible here.
# NOTE(review): the call is issued twice with identical arguments — presumably a
# second pass is needed for the five frames to end up with the same companies;
# confirm, or drop the duplicate if one call is enough.
remove_columns(prices,wacc,sales_growth,market_cap,shares_outstanding)
remove_columns(prices,wacc,sales_growth,market_cap,shares_outstanding)

#### To deal with the remaining NaNs in wacc and sales_growth we are going to fill each of them with the average of the values in its time range

In [13]:
# fill_na_mean is not defined in this notebook (presumably it comes from the
# `apifunctions` star import). The return values are not assigned, so this cell
# only has an effect if the helper modifies the frames in place — TODO confirm.
fill_na_mean(wacc)
fill_na_mean(sales_growth)

#### At this point we have cleaned the three dataframes wacc, prices and sales_growth. Now we need to deal with the parameters dataframe

In [14]:
# Index labels of wacc that remain after the cleaning steps above.
final_company_list = wacc.index

In [15]:
# Companies present in the original ID column but no longer in the cleaned index.
deleted_companies = [
    ticker for ticker in company_list if ticker not in final_company_list
]

### Parameters dataframe

#### We first create a column containing only the year, aggregate by it so that the years become the index, and transpose the dataframe to have it in the same format as the rest:

In [16]:
# Text form of every value in the first (unnamed) column of parameters.
lista = [str(raw_value) for raw_value in parameters["Unnamed: 0"]]

# The first four characters of each text value (the year, for date-like values).
year = [text_value[:4] for text_value in lista]
    
    

In [17]:
# Attach the four-character labels as a "dates" column, then sum the rows that
# share the same label so each label becomes one row of parameters_new.
parameters["dates"] = year
parameters_new = parameters.groupby(by="dates").sum()

In [18]:
# Swap rows and columns: the "dates" labels become the columns.
parameters_new_t = parameters_new.T

In [19]:
# Copy the row labels into a regular column so they can be edited as strings.
parameters_new_t["company_name"] = parameters_new_t.index

#### We add a column named company_name with the ticker of each company

In [20]:
# Strip a ".<digits>" suffix (e.g. ".1", ".2") from every company_name value.
# NOTE(review): the suffixes presumably come from pandas de-duplicating repeated
# column headers when the workbook was read — confirm.
# regex=True is required: pandas >= 2.0 treats the pattern as a literal string by
# default, which would leave the suffixes in place. A raw string is used so the
# backslashes are not parsed as (invalid) Python escape sequences.
parameters_new_t["company_name"] = parameters_new_t["company_name"].str.replace(
    r"\.\d+", "", regex=True
)

#### As we don't have values for 2022, we drop the entire column

In [21]:
# Discard the "2022" column.
parameters_new_t = parameters_new_t.drop(columns=["2022"])

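#### We convert the numbers to float (this step is currently commented out) and then delete the rows which have at least one missing value (in the code below, a row is dropped when any of its yearly values equals 0)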

In [22]:
#parameters_new_t[["2010","2011","2012","2013","2014","2015","2016","2017","2018","2019","2020","2021"]].astype(dtype="float64")

In [23]:
# Keep only the rows whose 2010-2021 values are all different from 0.
year_columns = [
    "2010", "2011", "2012", "2013", "2014", "2015",
    "2016", "2017", "2018", "2019", "2020", "2021",
]
has_zero_year = (parameters_new_t[year_columns] == 0).any(axis=1)
parameters_new_t = parameters_new_t[~has_zero_year]

#### Now we need to check for which companies we have full data

In [24]:
# company_name values of the rows that survived the filtering above.
companies_we_have = parameters_new_t["company_name"]

In [25]:
# Hand-written list of the company identifiers to keep.
# NOTE(review): six entries (IFF, UHS, WEC, HSY, HON, MSFT) end with a space
# inside the quotes; they can only match labels that carry the same trailing
# space — confirm this is intended.
final_comps = [
    "IFF UN Equity ", "NTAP UW Equity", "ATO UN Equity", "GWW UN Equity",
    "UHS UN Equity ", "WEC UN Equity ", "SWKS UW Equity", "HSY UN Equity ",
    "DGX UN Equity", "HRL UN Equity", "EW UN Equity", "MDLZ UW Equity",
    "ATVI UW Equity", "HUM UN Equity", "ROK UN Equity", "ITW UN Equity",
    "TT UN Equity", "IPG UN Equity", "WM UN Equity", "J UN Equity",
    "BR UN Equity", "GPC UN Equity", "GIS UN Equity", "GD UN Equity",
    "KLAC UW Equity", "COST UW Equity", "PCAR UW Equity", "GOOG UW Equity",
    "AEE UN Equity", "ECL UN Equity", "EMR UN Equity", "ODFL UW Equity",
    "AON UN Equity", "DVA UN Equity", "CBRE UN Equity", "MNST UW Equity",
    "CTAS UW Equity", "EL UN Equity", "BRO UN Equity", "AAPL UW Equity",
    "AMGN UW Equity", "KMX UN Equity", "MA UN Equity", "KMB UN Equity",
    "PM UN Equity", "NDAQ UW Equity", "SO UN Equity", "BKNG UW Equity",
    "MCO UN Equity", "OMC UN Equity", "OKE UN Equity", "PWR UN Equity",
    "PH UN Equity", "ROL UN Equity", "PPL UN Equity", "AME UN Equity",
    "NOC UN Equity", "RSG UN Equity", "ISRG UW Equity", "PPG UN Equity",
    "CTSH UW Equity", "HSIC UW Equity", "RHI UN Equity", "WST UN Equity",
    "FDS UN Equity", "FFIV UW Equity", "ES UN Equity", "UNH UN Equity",
    "CHRW UW Equity", "LLY UN Equity", "APH UN Equity", "ULTA UW Equity",
    "ANTM UN Equity", "LOW UN Equity", "IEX UN Equity", "MMC UN Equity",
    "SPGI UN Equity", "ACN UN Equity", "AKAM UW Equity", "CVS UN Equity",
    "TXN UW Equity", "SYY UN Equity", "GOOGL UW Equity", "TDG UN Equity",
    "YUM UN Equity", "NKE UN Equity", "MKTX UW Equity", "DOV UN Equity",
    "ANSS UW Equity", "DE UN Equity", "PAYX UW Equity", "ORLY UW Equity",
    "BWA UN Equity", "BIIB UW Equity", "HON UW Equity ", "WMT UN Equity",
    "CSCO UW Equity", "INTC UW Equity", "MSFT UW Equity ", "DG UN Equity",
    "CI UN Equity", "HAS UW Equity", "AMCR UN Equity", "UPS UN Equity",
    "HCA UN Equity", "TGT UN Equity", "MHK UN Equity", "FISV UW Equity",
    "PG UN Equity", "CNC UN Equity", "APD UN Equity", "AWK UN Equity",
    "EQIX UW Equity", "AOS UN Equity", "CAT UN Equity", "LKQ UW Equity",
    "KO UN Equity", "APTV UN Equity", "INTU UW Equity", "FLT UN Equity",
    "IDXX UW Equity", "ROST UW Equity", "ROP UN Equity", "HD UN Equity",
    "MPWR UW Equity", "QCOM UW Equity", "MCD UN Equity", "MRK UN Equity",
    "MMM UN Equity", "STE UN Equity", "WBA UW Equity", "CPRT UW Equity",
    "FAST UW Equity", "NDSN UW Equity", "BBY UN Equity", "NVR UN Equity",
    "ALB UN Equity", "EPAM UN Equity", "BF/B UN Equity", "CPB UN Equity",
    "IPGP UW Equity", "MTD UN Equity", "RMD UN Equity", "TSCO UW Equity",
    "AMAT UW Equity", "CLX UN Equity", "CMS UN Equity", "WAB UN Equity",
    "POOL UW Equity", "CAG UN Equity", "AZO UN Equity", "DHR UN Equity",
    "CMI UN Equity", "EXPD UW Equity", "ADM UN Equity", "ADP UW Equity",
    "VRSK UW Equity", "CL UN Equity", "LMT UN Equity", "V UN Equity",
    "ED UN Equity", "MSCI UN Equity", "WAT UN Equity",
]

In [26]:
# Entries of final_comps that are also labels of the cleaned wacc index.
companies_to_use = [
    ticker for ticker in final_comps if ticker in final_company_list
]

In [27]:
# Divide every wacc value by 100. Re-running this cell divides again.
wacc = wacc.div(100)

In [28]:
# Divide every sales_growth value by 100. Re-running this cell divides again.
sales_growth = sales_growth.div(100)

In [29]:
# Attempts to divide the 2010-2021 values of the rows whose "DATE" column equals
# "EBITDA_TO_REVENUE" by 100.
# NOTE(review): the left-hand side is chained indexing (`df[cols][mask] = ...`);
# `df[cols]` builds a new frame, so the assignment presumably lands on that
# temporary object and leaves parameters_new_t itself unchanged — confirm.
# NOTE(review): the right-hand side filters on "company_name" while the left-hand
# side filters on "DATE" — this mismatch looks unintended; verify.
parameters_new_t[["2010","2011","2012","2013","2014","2015","2016","2017","2018","2019","2020","2021"]][parameters_new_t["DATE"]=="EBITDA_TO_REVENUE"]=parameters_new_t[["2010","2011","2012","2013","2014","2015","2016","2017","2018","2019","2020","2021"]][parameters_new_t["company_name"]=="EBITDA_TO_REVENUE"]/100

In [30]:
# Divide the 2010-2021 values of the EBITDA_TO_REVENUE rows by 100 (the same
# scaling this notebook applies to wacc and sales_growth).
#
# The previous form, `df[cols][mask] = ...`, was chained indexing: `df[cols]`
# returns a new frame, so the assignment never reached parameters_new_t. A single
# `.loc[rows, cols]` assignment writes into parameters_new_t itself.
# Re-running this cell divides the values again.
year_columns = [
    "2010", "2011", "2012", "2013", "2014", "2015",
    "2016", "2017", "2018", "2019", "2020", "2021",
]
is_ebitda_to_revenue = parameters_new_t["DATE"] == "EBITDA_TO_REVENUE"
parameters_new_t.loc[is_ebitda_to_revenue, year_columns] = (
    parameters_new_t.loc[is_ebitda_to_revenue, year_columns] / 100
)

In [31]:
# Wrap the list in a DataFrame so it can be written out with to_csv.
companies_to_use = pd.DataFrame(data=companies_to_use)

In [38]:
# Write each cleaned dataframe to its CSV file under ../data.
for frame, destination in (
    (wacc, "../data/wacc.csv"),
    (prices, "../data/prices.csv"),
    (sales_growth, "../data/sales_growth.csv"),
    (parameters_new_t, "../data/parameters_new_t.csv"),
    (companies_to_use, "../data/companies_to_use.csv"),
    (market_cap, "../data/market_cap.csv"),
    (shares_outstanding, "../data/shares_outstanding.csv"),
):
    frame.to_csv(destination)