In [14]:
# To support both python 2 and python 3
from __future__ import division, print_function, unicode_literals

# Common imports and toolboxes needed for workflow
# System imports
import os
import sys

# Mathematical imports
import numpy as np
import math

# To make this notebook's output stable across runs
np.random.seed(42)

# Data structure imports
import csv
import glob
from collections import Counter # https://docs.python.org/2/library/collections.html
import re
import pandas as pd
from pandas import set_option
set_option('display.max_columns',400)


# Machine Learning and Statistical imports
import scipy
from sklearn.cluster import KMeans

def _major_minor(version):
    """Return the leading ``(major, minor)`` integers of a version string.

    Version strings must not be compared lexicographically: as strings,
    ``"10.0" >= "2.0"`` is False and ``"0.9" >= "0.20"`` is True. The checks
    below therefore compare integer tuples instead.
    """
    return tuple(int(part) for part in re.match(r"(\d+)\.(\d+)", version).groups())

# Scikit-Learn ≥0.20 is required
import sklearn
assert _major_minor(sklearn.__version__) >= (0, 20), "Scikit-Learn >= 0.20 is required"

# TensorFlow ≥2.0 is required
import tensorflow as tf
from tensorflow import keras
assert _major_minor(tf.__version__) >= (2, 0), "TensorFlow >= 2.0 is required"


# Visualization imports
%matplotlib inline
import matplotlib as mpl
import matplotlib.pyplot as plt
import matplotlib.colors as colors
from matplotlib import image as img
# Default font sizes for axis labels and tick labels on every figure.
mpl.rc('axes', labelsize=14)
mpl.rc('xtick', labelsize=12)
mpl.rc('ytick', labelsize=12)
# Default figure size, in inches (width, height).
# NOTE(review): (100, 100) is very large; saved at save_fig's default dpi of 300 that
# is 30000 x 30000 pixels per figure. Confirm this is intended.
plt.rcParams['figure.figsize'] = (100,100)

import seaborn as sns

from bokeh.io import push_notebook, show, output_notebook
from bokeh.models import ColumnDataSource, ColorBar
from bokeh.palettes import Spectral6
from bokeh.transform import linear_cmap
from bokeh.plotting import figure
output_notebook()

# Where to save the figures: <PROJECT_ROOT_DIR>/Images/<IMAGE_ID>.
# The path is relative to the notebook's working directory; the folder is
# created here if it does not exist yet (exist_ok=True makes re-runs safe).
PROJECT_ROOT_DIR = "."
IMAGE_ID = "EDA_Images"
IMAGES_PATH = os.path.join(PROJECT_ROOT_DIR, "Images", IMAGE_ID)
os.makedirs(IMAGES_PATH, exist_ok=True)

def save_fig(fig_id, tight_layout=True, fig_extension="png", resolution=300):
    """Save the current matplotlib figure under ``IMAGES_PATH``.

    Parameters
    ----------
    fig_id : str
        Base file name (without extension); also echoed in the progress message.
    tight_layout : bool, optional
        When true, ``plt.tight_layout()`` is applied before saving.
    fig_extension : str, optional
        File extension, also passed to ``plt.savefig`` as ``format``.
    resolution : int, optional
        Passed to ``plt.savefig`` as ``dpi``.
    """
    target = os.path.join(IMAGES_PATH, "".join((fig_id, ".", fig_extension)))
    print("Saving figure", fig_id)
    if tight_layout:
        plt.tight_layout()
    plt.savefig(target, dpi=resolution, format=fig_extension)


# Silence warnings for the rest of the session.
# NOTE(review): filterwarnings('ignore') with no category suppresses every warning,
# not only the noisy ones, so the DeprecationWarning rule below adds nothing on top
# of it. Consider narrowing these filters if real warnings should stay visible.
import warnings
warnings.filterwarnings('ignore')
warnings.simplefilter('ignore', DeprecationWarning)


In [19]:
%%time
# Root folder that createFileList walks to find the raw data files.
# NOTE(review): absolute, machine-specific path; the notebook cannot run on another
# machine without editing this line.
mydir='/Users/Brandon/Documents/GitHub/COMPS/Raw Data/'

def createFileList(myDir, format='.csv'):
    """Recursively collect the files under ``myDir`` whose names end with ``format``.

    Parameters
    ----------
    myDir : str
        Directory to walk; sub-directories are included.
    format : str, optional
        File-name suffix to keep. Defaults to ``'.csv'``.

    Returns
    -------
    list of str
        ``os.path.join(root, name)`` for every matching file, in the order
        produced by ``os.walk(myDir, topdown=False)``.
    """
    print('\nCurrent Working Directory:\n', myDir, end='\n')

    filelist = [
        os.path.join(root, name)
        for root, _dirs, names in os.walk(myDir, topdown=False)
        for name in names
        if name.endswith(format)
    ]

    # Report the result once, after the whole tree has been walked. Printing
    # inside the walk loop repeated the growing list for every directory visited.
    print('\nList of SIC Data:\n', filelist, end='\n')
    return filelist

# Collect every '.csv' path (the default suffix) found under mydir.
filelist = createFileList(mydir)


Current Working Directory:
 /Users/Brandon/Documents/GitHub/COMPS/Raw Data/

List of SIC Data:
 ['/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_0_advancesearch16784737975e1a5b2c8cbeb.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_1_advancesearch12906045365e1a5bb125324.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_2_advancesearch15616274825e1a5c405bce4.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_3_advancesearch16953607965e1a5cf27817a.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_4_advancesearch14170920915e1a5dbd6cddc.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_5_advancesearch8208422685e1a5e4281b83.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_6_advancesearch15668837465e1a60171bf79.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_7_advancesearch5468595875e1a60a2066b1.csv', '/Users/Brandon/Documents/GitHub/COMPS/Raw Data/SIC_8_advancesearch19810233385e1a613f38c47.csv', '/Users/Brandon/Documents/GitHu

In [20]:
%%time
# Sort the data-file paths in place (later cells pick files by position in this
# list), then display the sorted list.
filelist.sort()
filelist

Wall time: 0 ns


In [21]:
%%time
def _read_all_sheets(path):
    """Load every sheet of the workbook at ``path`` into a single DataFrame.

    ``sheet_name=None`` makes ``pd.read_excel`` return a dict with one
    DataFrame per sheet; ``pd.concat`` stacks them and ``ignore_index=True``
    renumbers the rows from 0.
    """
    sheets = pd.read_excel(path, sheet_name=None, parse_dates=True, thousands=',')
    return pd.concat(sheets, ignore_index=True)


# One frame per raw file, taken from the first ten entries of ``filelist``.
# NOTE(review): the paths end in '.csv' but are read with pd.read_excel; confirm
# the files really are Excel workbooks.
sic0, sic1, sic2, sic3, sic4, sic5, sic6, sic7, sic8, sic9 = (
    _read_all_sheets(path) for path in filelist[:10]
)

Wall time: 11.7 s


In [22]:
# Preview only the first rows; the frame is too wide (126 columns) to dump whole.
sic0.head(10)

Unnamed: 0,D-U-N-S@ Number,Company Name,URL,Founding,EIN,Country,State,SIC,Employees,Year3 Total Assets,Year2 Total Assets,Year1 Total Assets,Year3 Current Assets,Year2 Current Assets,Year1 Current Assets,Year3 Total Liabilities,Year2 Total Liabilities,Year1 Total Liabilities,Year3 Long Term Debt,Year2 Long Term Debt,Year1 Long Term Debt,Year3 Stockholders' Equity,Year2 Stockholders' Equity,Year1 Stockholders' Equity,Year3 Total Assets per Share,Year2 Total Assets per Share,Year1 Total Assets per Share,Year3 Current Liabilities,Year2 Current Liabilities,Year1 Current Liabilities,Year3 Net Assets per Share,Year2 Net Assets per Share,Year1 Net Assets per Share,Year3 Total Revenue,Year2 Total Revenue,Year1 Total Revenue,Year3 EBITDA,Year2 EBITDA,Year1 EBITDA,Year3 Operating Income,Year2 Operating Income,Year1 Operating Income,Year3 Net Income,Year2 Net Income,Year1 Net Income,Year3 Revenue per Share,Year2 Revenue per Share,Year1 Revenue per Share,Year3 EPS from Continuing Operations,Year2 EPS from Continuing Operations,Year1 EPS from Continuing Operations,Year3 EPS - Net Income - Diluted,Year2 EPS - Net Income - Diluted,Year1 EPS - Net Income - Diluted,Year3 Share Outstanding,Year2 Share Outstanding,Year1 Share Outstanding,Year3 Weighted Average Shares Outstanding - Basic,Year2 Weighted Average Shares Outstanding - Basic,Year1 Weighted Average Shares Outstanding - Basic,Year3 Weighted Average Shares Outstanding - Diluted,Year2 Weighted Average Shares Outstanding - Diluted,Year1 Weighted Average Shares Outstanding - Diluted,Year3 Earnings per Share - Basic,Year2 Earnings per Share - Basic,Year1 Earnings per Share - Basic,Year3 Cash from Operations,Year2 Cash from Operations,Year1 Cash from Operations,Year3 Cash from Investing,Year2 Cash from Investing,Year1 Cash from Investing,Year3 Cash from Financing,Year2 Cash from Financing,Year1 Cash from Financing,Year3 Capital Expenditures,Year2 Capital Expenditures,Year1 Capital Expenditures,Year3 Cash Flow per Share,Year2 Cash 
Flow per Share,Year1 Cash Flow per Share,"Year3 Cash & Cash Equivalents, Beginning of Year","Year2 Cash & Cash Equivalents, Beginning of Year","Year1 Cash & Cash Equivalents, Beginning of Year","Year3 Cash & Cash Equivalents, End of Year","Year2 Cash & Cash Equivalents, End of Year","Year1 Cash & Cash Equivalents, End of Year",Year3 Gross Margin,Year2 Gross Margin,Year1 Gross Margin,Year3 Operating Margin,Year2 Operating Margin,Year1 Operating Margin,Year3 EBITDA Margin %,Year2 EBITDA Margin %,Year1 EBITDA Margin %,Year3 Calculated Tax Rate %,Year2 Calculated Tax Rate %,Year1 Calculated Tax Rate %,Year3 Profit Margin (TTM),Year2 Profit Margin (TTM),Year1 Profit Margin (TTM),Year3 Price/Earnings (TTM),Year2 Price/Earnings (TTM),Year1 Price/Earnings (TTM),Year3 Price/Book (TTM),Year2 Price/Book (TTM),Year1 Price/Book (TTM),Year3 Price/Cash Flow(TTM),Year2 Price/Cash Flow(TTM),Year1 Price/Cash Flow(TTM),Year3 Quick Ratio,Year2 Quick Ratio,Year1 Quick Ratio,Year3 Current Ratio,Year2 Current Ratio,Year1 Current Ratio,Year3 Net Current Assets as % of Total Assets,Year2 Net Current Assets as % of Total Assets,Year1 Net Current Assets as % of Total Assets,Year3 Free Cash Flow per Share,Year2 Free Cash Flow per Share,Year1 Free Cash Flow per Share,Year3 Revenue to Assets,Year2 Revenue to Assets,Year1 Revenue to Assets
0,11-681-4324,"CORTEVA, INC.",WWW.CORTEVA.COM,2 18,824979 96,USA,DELAWARE,721,44,,7207000000.0,7773000000,,3962000000.0,4708000000,,2599000000,2738000000,,23000000.0,5000000.0,,4608000000.0,5035000000.0,,,,,2011000000,2215000000,,,,6144000000.0,5975000000.0,5646000000.0,780000000.0,730000000,261000000,653000000.0,329000000.0,136000000.0,673000000.0,90000000,-26000000,,,,,,,,,,,,,,,,,,,,,,410000000.0,-502000000,-365000000,-152000000.0,874000000.0,-171000000.0,-56000000.0,-624000000,488000000.0,179000000.0,142000000.0,202000000.0,,,,156000000.0,358000000.0,106000000.0,358000000.0,106000000.0,58000000,34.57,33.14,31.05,10.63,5.51,2.41,12.7,12.22,4.62,-7.56,80.53,111.71,10.95,1.51,-0.46,,,,,,,,,,,0.97,1.25,,1.97,2.13,,27.07,32.07,,,,,0.83,0.73
1,05-154-1597,"CHIQUITA BRANDS INTERNATIONAL, INC.",WWW.CHIQUITA.COM,1899,4192336,USA,FLORIDA,179,"2 ,",1697762000.0,1659138000.0,1612038000,680476000.0,629195000.0,583064000,1327360000.0,1284700000,1288704000,540517000.0,629353000.0,637518000.0,370402000.0,374438000.0,323334000.0,36.65,35.43,34.22,480332000.0,408578000,378944000,8.0,8.0,6.86,3078337000.0,3057482000.0,3090224000.0,-168458000.0,102749000,65525000,-220401000.0,49587000.0,24654000.0,-405017000.0,-15815000,-62536000,66.65,65.64,65.8,-8.75,-0.34,-1.33,-8.79,-0.34,-1.33,46317430.0,46829910.0,47112310.0,46059000.0,46577000.0,46963000.0,46059000.0,46577000.0,46963000.0,-8.79,-0.34,-1.33,32577000.0,91479000,53801000,-47639000.0,-50762000.0,-46761000.0,20827000.0,-37726000,-12897000.0,53440000.0,49054000.0,49651000.0,0.71,1.96,1.15,45261000.0,51026000.0,54017000.0,51026000.0,54017000.0,48160000,10.89,11.42,11.49,-7.16,1.62,0.8,-5.47,3.36,2.12,EBT<0,EBT<0,EBT<0,-13.16,-0.52,-2.02,,,,1.03,1.46,2.11,11.7,5.96,12.62,0.82,0.87,0.86,1.42,1.54,1.54,11.79,13.3,12.66,-0.45,0.91,0.09,1.81,1.84,1.92
2,19-699-1731,THE ANDERSONS INC,WWW.ANDERSONSINC.COM,1947,341562374,USA,OHIO,723,1858,2232849000.0,2162354000.0,2392003000,1058126000.0,999211000.0,1023198000,1458488000.0,1347152000,1561681000,397065000.0,418339000.0,496187000.0,774361000.0,815202000.0,830322000.0,79.1,76.23,83.95,799776000.0,738716000,833350000,27.43,28.74,29.14,3924790000.0,3686345000.0,3045382000.0,100279000.0,52619000,125063000,18004000.0,-39125000.0,37861000.0,11594000.0,42511000,41484000,138.83,131.07,107.77,0.41,1.5,1.46,0.41,1.5,1.46,28229000.0,28367000.0,28494000.0,28193000.0,28126000.0,28258000.0,28431000.0,28296000.0,28452000.0,0.41,1.51,1.47,39585000.0,75285000,-35519000,-28218000.0,-113494000.0,-185993000.0,-12487000.0,10498000,209186000.0,163008000.0,177622000.0,309584000.0,1.39,2.66,-1.25,63750000.0,62630000.0,34919000.0,62630000.0,34919000.0,22593000,8.8,8.65,9.92,0.46,-1.06,1.24,2.56,1.43,4.11,59.27,EBT<0,45.86,0.3,1.15,1.36,109.32,20.63,20.33,1.63,1.08,1.03,31.92,11.64,,0.31,0.28,0.27,1.32,1.35,1.23,11.57,12.05,7.94,-2.34,-2.33,-9.4,1.76,1.7,1.27
3,07-941-1785,"BRIGHTVIEW HOLDINGS, INC.",WWW.BRIGHTVIEW.COM,2 13,,USA,PENNSYLVANIA,781,19,2858620000.0,2891898000.0,2928600000,502521000.0,531165000.0,551400000,2162359000.0,1664571000,1644800000,1574882000.0,1141279000.0,1134200000.0,696261000.0,1227327000.0,1283800000.0,37.08,27.68,28.03,342149000.0,331470000,332700000,9.03,11.75,12.29,1713579000.0,2353603000.0,2404600000.0,198534000.0,197259000,263400000,49077000.0,39953000.0,129700000.0,-13955000.0,-15087000,44400000,29.73,28.23,23.39,-0.18,-0.18,0.43,-0.18,-0.18,0.43,77083000.0,104470000.0,104470000.0,77071000.0,83369000.0,102800000.0,77071000.0,83369000.0,103363000.0,-0.18,-0.18,0.43,78899000.0,180383000,169700000,-97462000.0,-179270000.0,-145500000.0,-36621000.0,21332000,-20300000.0,50633000.0,86425000.0,89900000.0,1.02,2.16,1.64,67963000.0,12779000.0,35200000.0,12779000.0,35224000.0,39100000,26.48,26.6,26.54,2.86,1.7,5.39,11.59,8.38,10.95,EBT<0,EBT<0,22.38,-0.81,-0.64,1.85,,,39.88,,1.37,1.4,,7.42,10.39,0.98,1.04,1.1,1.47,1.6,1.66,5.61,6.91,7.47,0.6,1.27,0.84,0.6,0.81,0.82
4,05-064-3436,"CAL-MAINE FOODS, INC.",WWW.CALMAINEFOODS.COM,1957,64 5 378,USA,MISSISSIPPI,252,3573,1033094000.0,1150447000.0,1156278000,436206000.0,587520000.0,567753000,190407000.0,197114000,169654000,6113000.0,2554000.0,641000.0,842687000.0,953333000.0,986624000.0,21.27,23.66,23.75,64679000.0,107838000,74907000,17.35,19.6,20.26,1074513000.0,1502932000.0,1361188000.0,-69669000.0,161488000,110395000,-128430000.0,103148000.0,45814000.0,-74278000.0,125932000,54229000,21.86,31.17,28.16,-1.54,2.6,1.12,-1.54,2.6,1.12,48577000.0,48631000.0,48694000.0,48362000.0,48353000.0,48467000.0,48362000.0,48468000.0,48589000.0,-1.54,2.6,1.12,-49316000.0,200415000,115085000,56132000.0,-163850000.0,-47817000.0,-18298000.0,-5698000,-46452000.0,66657000.0,19671000.0,67989000.0,-1.02,4.13,2.37,29046000.0,17564000.0,48431000.0,17564000.0,48431000.0,69247000,4.24,24.02,16.37,-11.95,6.86,3.37,-6.48,10.74,8.11,EBT<0,-7.78,23.84,-6.91,8.38,3.98,,17.95,32.96,2.22,2.39,1.83,,11.26,15.55,3.41,3.87,5.09,6.74,5.45,7.58,35.96,41.7,42.62,-2.36,3.77,1.01,1.04,1.31,1.18
5,61-925-0665,"HINES HORTICULTURE, INC.",WWW.HINESHORT.COM,192,33 411319,USA,CALIFORNIA,181,21,397729000.0,388135000.0,340368000,204174000.0,204287000.0,193333000,336763000.0,329727000,331126000,203571000.0,175000000.0,175000000.0,60966000.0,58408000.0,9242000.0,18.02,17.58,15.42,129540000.0,109469000,124074000,2.76,2.65,0.42,335168000.0,327913000.0,232570000.0,55437000.0,35904000,-1415000,38546000.0,20734000.0,-11403000.0,8236000.0,-2558000,-46472000,15.14,14.86,10.54,0.37,-0.12,-0.89,0.37,-0.12,-2.11,22072550.0,22072550.0,22072550.0,22072550.0,22072550.0,22072550.0,22121180.0,22072550.0,22072550.0,0.37,-0.12,-2.11,19115000.0,7074000,-12966000,-6541000.0,40423000.0,5997000.0,-12574000.0,-48035000,7015000.0,5869000.0,10258000.0,12034000.0,,,,,600000.0,62000.0,,62000.0,108000,49.07,46.76,41.64,11.5,6.32,-4.9,16.54,10.95,-0.61,41.32,EBT<0,EBT<0,2.46,-0.78,-19.98,,,,,,,,,,0.15,0.15,0.09,1.58,1.87,1.56,18.77,24.43,20.35,0.61,2.15,-1.13,0.84,0.84,0.68
6,00-896-5428,"DOLE FOOD COMPANY, INC.",WWW.DOLE.COM,1851,99 353,USA,CALIFORNIA,179,1534,4607994000.0,4642884000.0,4364619000,1663278000.0,1846514000.0,1987967000,4272782000.0,4317876000,3961719000,2315597000.0,2316208000.0,1798556000.0,335212000.0,325008000.0,402900000.0,4607994.0,4642884.0,4364619.0,977066000.0,1152732000,1456920000,335212.0,325008.0,402900.0,6171464000.0,6930965000.0,7619952000.0,254553000.0,283071000,395052000,85619000.0,130123000.0,247642000.0,-88983000.0,-57506000,121005000,,,,,,,,,,1000.0,1000.0,1000.0,,,,,,,,,,15921000.0,46322000,44563000,-117000000.0,-61383000.0,141142000.0,142832000.0,16045000,-185520000.0,125056000.0,106821000.0,85096000.0,,,,48812000.0,92414000.0,97061000.0,92414000.0,97061000.0,90829000,8.74,8.99,9.94,1.39,1.88,3.25,4.12,4.08,5.18,EBT<0,EBT<0,-51.9,-1.44,-0.83,1.59,,,,,,,,,,0.82,0.77,0.59,1.7,1.6,1.36,14.89,14.94,12.17,,,,1.34,1.49,1.75
7,01-807-6351,"MICHAEL FOODS, INC.",WWW.MICHAELFOODS.COM,1928,134151741,USA,MINNESOTA,252,3596,,1333576000.0,1263763000,,251869000.0,238502000,,1029561000,938969000,,706239000.0,644957000.0,,304015000.0,324794000.0,,444525.0,421254.0,,171946000,160144000,,101338.0,108265.0,1313504000.0,1242498000.0,1247348000.0,165097000.0,170791000,168948000,98240000.0,106247000.0,94090000.0,33514000.0,38859000,19155000,,,,,,,,,,3000.0,3000.0,3000.0,,,,,,,,,,121647000.0,104402000,76766000,-36381000.0,-41507000.0,-33904000.0,-99232000.0,-52562000,-63466000.0,37695000.0,40690000.0,33806000.0,,,,45594000.0,31816000.0,42179000.0,31816000.0,42179000.0,21576000,18.0,19.0,18.0,7.0,9.0,8.0,13.0,14.0,14.0,38,27,43,3.0,3.0,2.0,,,,,,,,,,,1.0,1.0,,1.0,1.0,,6.0,6.0,,,,,1.0,1.0
8,00-790-3180,THE DAVEY TREE EXPERT COMPANY,WWW.DAVEY.COM,19 9,34 17611,USA,OHIO,783,86,423939000.0,473135000.0,526623000,178773000.0,209125000.0,255068000,271760000.0,311745000,364213000,92290000.0,119210000.0,158425000.0,152179000.0,161390000.0,162410000.0,17.01,19.53,23.02,118905000.0,128657000,139312000,6.11,6.66,7.1,845678000.0,915958000.0,1024791000.0,90972000.0,95674000,101154000,40707000.0,43016000.0,50584000.0,22284000.0,22120000,27977000,32.17,35.84,42.02,0.82,0.83,1.1,0.82,0.83,1.1,24923140.0,24220900.0,22880650.0,26212000.0,25557470.0,24388740.0,27248000.0,26697060.0,25480620.0,0.85,0.87,1.15,55370000.0,56776000,62104000,-54808000.0,-59518000.0,-61377000.0,-7721000.0,6410000,9065000.0,56646000.0,57100000.0,60410000.0,2.03,2.13,2.44,16030000.0,9006000.0,13121000.0,9006000.0,13121000.0,22661000,35.97,35.88,35.07,4.81,4.7,4.94,10.76,10.45,9.87,40.17,41.78,25.39,2.64,2.41,2.73,,,,,,,,,,1.24,1.35,1.51,1.5,1.63,1.83,14.12,17.01,21.98,0.17,0.18,0.38,1.99,1.94,1.95
9,00-944-8200,POTLATCHDELTIC CORPORATION,WWW.POTLATCHDELTIC.COM,19 3,82 156 45,USA,WASHINGTON,831,953,927681000.0,953079000.0,2325852000,163645000.0,193307000.0,262198000,771407000.0,752537000,1011073000,572956000.0,559056000.0,715391000.0,156274000.0,200542000.0,1314779000.0,22.89,23.47,34.42,60581000.0,74798000,136284000,3.86,4.94,19.46,599099000.0,678595000.0,974579000.0,43854000.0,153623000,200106000,84076000.0,144435000.0,184954000.0,10938000.0,86453000,122880000,14.64,16.62,16.1,0.27,2.1,1.99,0.27,2.1,1.99,40519350.0,40611990.0,67569800.0,40797810.0,40824000.0,60533620.0,41033440.0,41227000.0,61813720.0,0.27,2.12,2.03,102117000.0,162659000,178894000,93351000.0,-50020000.0,-47909000.0,-120809000.0,-74766000,-172001000.0,7110000.0,34898000.0,34757000.0,2.49,3.95,2.89,7925000.0,82584000.0,120457000.0,82584000.0,120457000.0,79441000,22.83,30.69,27.39,14.03,21.28,18.98,7.32,22.64,20.53,-65.4,27.03,13.51,1.83,12.74,12.61,154.68,23.54,15.59,10.8,10.11,1.63,16.69,12.52,10.71,1.52,1.66,0.66,2.7,2.58,1.92,11.11,12.43,5.41,5.05,3.13,2.38,0.65,0.71,0.42


In [23]:
# Summarise sic0: row range, column count, dtype breakdown and memory usage.
sic0.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 38 entries, 0 to 37
Columns: 126 entries, D-U-N-S@ Number to Year1 Revenue to Assets
dtypes: float64(100), int64(15), object(11)
memory usage: 37.5+ KB


In [24]:
%%time
# The ten per-file frames, in file order.
list_of_dfs = [sic0,sic1,sic2,sic3,sic4,sic5,sic6,sic7,sic8,sic9]

# Stack them into one frame with a fresh 0..n-1 index. pd.concat already returns
# a DataFrame, so no extra pd.DataFrame(...) wrapper is needed.
data = pd.concat(list_of_dfs, ignore_index=True)

# Write the combined DataFrame to an Excel sheet. The target folder is created
# first so that to_excel does not fail when it does not exist yet.
appended_path = '/Users/Brandon/Documents/GitHub/COMPS/Clean Data/appended.xlsx'
os.makedirs(os.path.dirname(appended_path), exist_ok=True)
data.to_excel(appended_path)

Wall time: 12.5 s


In [25]:
# Summarise the combined frame: row range, column count, dtype breakdown, memory usage.
data.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 9987 entries, 0 to 9986
Columns: 126 entries, D-U-N-S@ Number to Year1 Revenue to Assets
dtypes: float64(105), object(21)
memory usage: 9.6+ MB


In [27]:
# Per-column dtypes of the combined frame.
# NOTE(review): columns such as Founding and EIN come out as object rather than a
# numeric dtype, presumably because of non-numeric values in the raw files. Confirm
# and clean before treating them as numbers.
data.dtypes

D-U-N-S@ Number                    object
Company Name                       object
URL                                object
Founding                           object
EIN                                object
                                   ...   
Year2 Free Cash Flow per Share    float64
Year1 Free Cash Flow per Share    float64
Year3 Revenue to Assets           float64
Year2 Revenue to Assets           float64
Year1 Revenue to Assets           float64
Length: 126, dtype: object