In [1]:
import os

# data frame basics
import pandas as pd
import numpy as np

# visualization basics
import matplotlib.pyplot as plt
import seaborn as sns

# math basics
from math import log
from scipy import stats, linalg

# Scikit learn Models and Selector Algos
from sklearn import neighbors
from sklearn.linear_model import LogisticRegression
from sklearn.ensemble import RandomForestClassifier

from sklearn.feature_selection import RFE
from sklearn.linear_model import LogisticRegression
from sklearn.model_selection import RandomizedSearchCV
from sklearn.model_selection import GridSearchCV



# Scikit learn metrics and reporting
from sklearn import metrics
from sklearn.metrics import confusion_matrix
from sklearn.metrics import classification_report
from sklearn.metrics import mean_squared_error 

# stuff to change, process, oversample data
from sklearn import preprocessing 
from imblearn.over_sampling import SMOTE
from sklearn.preprocessing import Imputer
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler


import warnings
warnings.filterwarnings('ignore')

# old statsmodel stuf
import statsmodels.api as sm
import statsmodels.formula.api as smf
import patsy


# magics

%matplotlib inline


  from numpy.core.umath_tests import inner1d


In [2]:
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)

In [5]:
df = pd.read_csv('../data/model_data_india.csv', low_memory= False)
df = df.drop(columns = 'Unnamed: 0')
df.head(10)

Unnamed: 0,sa_total_income,sa_sales,sa_total_assets,sa_pat,sa_total_liabilities,sa_gross_working_capital_cosm,sa_current_assets_incl_st_invest_loans,sa_current_liabilities,sa_cash_bal,sa_st_trade_bills_receivables,sa_debtors_more_6m,sa_st_trade_receivables,sa_nf_operating_expenses,sa_f_operating_expenses,sa_dep_owned_ast,sa_retained_profits,sa_pbit,sa_interest_inc,sa_interest_exp,sa_st_inventories,sa_pbdita_net_of_peoifi,sa_pbpt_net_of_peoi,sa_total_capital,sa_gross_fixed_assets,sa_pbdita,sa_cost_of_goods_sold,sa_cost_of_sales,sa_total_expense,sa_net_sales,sa_depreciation,sa_non_current_assets,sa_net_fixed_assets,sa_gross_fixed_assets.1,sa_non_fin_services_inc,sa_inc_fin_serv,sa_net_working_capital,sa_non_current_liabilities,sa_tot_inc_net_of_pe,sa_sales_n_chg_in_stk,sa_chg_in_assets_with_no_chg_in_efficiency,sa_chg_in_efficiency_with_no_chg_in_assets,sa_chg_in_efficiency_on_chg_in_assets,sa_reported_pat,sa_diff_in_pat,sa_pbpt,sa_pbt,sa_pbit_net_of_peoifi,sa_cash_profit,sa_equity_div_inc_dist_pc_pat,sa_sales_net_fixed_assets,sa_total_income_avg_tot_asset_net_miscexp_now_reval,sa_chg_in_efficiency_in_use_of_assets,sa_pc_chg_in_efficiency_with_no_chg_in_assets,sa_pc_chg_in_assets_with_no_chg_in_efficiency,sa_pc_chg_in_efficiency_on_chg_in_assets,sa_total_div_pc_pat,sa_total_interest_exp,sa_nf_oper_exp_pc_total_exp,sa_f_oper_exp_pc_total_exp,sa_fin_serv_exp_pc_total_exp,sa_pbpt_net_of_peoi_inc_fin_serv,sa_pat_cont_ops_pc_inc_cont_ops,sa_pat_discont_ops_pc_inc_discont_ops,sa_total_provisions_pc_pbdita,sa_write_offs_pc_pbdita,sa_depreciation_pc_pbdita,sa_amortisation_pc_pbdita,sa_fin_serv_exp_pc_pbdita,sa_prov_direct_tax_pc_pbdita,sa_pat_pc_pbdita,sa_pbdita_pc_total_inc,sa_pbt_pc_total_inc,sa_pat_pc_total_inc,sa_cash_profit_pc_total_inc,sa_pat_net_of_pe_pc_tot_inc_net_of_pe,sa_pat_net_of_pe_pc_avg_networth,sa_pat_pc_avg_networth,sa_cash_profit_pc_avg_networth,sa_pbpt_net_of_peoi_pc_avg_capital_employed,sa_pat_net_of_pe_pc_avg_capital_employed,sa_pat_pc_avg_capital_employed,sa_pat_net_of_pe_pc_avg_tot_asset_net_menow_reval,sa_pc_chg_in_profitability_with_no_chg_in_income,sa_st_trade_bills_receivables_pc_current_assets_incl_st_invest_loans,sa_quick_ratio,sa_current_ratio,sa_debt_equity,sa_cash_n_bank_no_fd_security_current_liab_n_prov,sa_cash_n_bank_no_fd_security_cost_of_sales_per_day,sa_rawmat_stores_spares_avg_stk_rawmat_stores,sa_cost_of_goods_sold_avg_stk_fg,sa_sales_avg_debtors,sa_creditors_turnover,sa_total_inc_net_of_pe_compensation_to_empl,sa_sales_avg_gfa_net_of_reval,sa_sales_net_repairs_avg_nfa_net_of_reval,delisted
0,3741.8,3729.3,3661.4,131.6,3661.4,1606.7038,1557.9,1399.7,1.6,548.6,,548.6,3177.5,3405.7,89.8,131.6,429.8,5.6,216.8,591.7,509.0,196.6,176.4,2384.5,519.6,2360.19,3319.6,3567.4,3569.9,89.8,2103.5,1560.3,2384.5,18.5,5.6,-40.0,901.1,3738.3,3686.5,198.5575,14.809,0.8336,131.6,0.0,201.6,193.2,419.2,247.7,0.0,239.0117,1.0683,1.1476,6.9136,92.6972,1.2432,0.0,216.8,89.0705,95.4673,6.3968,35.1071,3.517,0.0,1.5012,0.1155,17.2825,0.0,43.9184,11.8553,25.3272,13.8864,5.1633,3.517,6.6198,3.4775,12.9039,13.0627,24.5868,7.8308,5.178,5.2418,3.7114,75.0796,35.2141,0.517,0.9745,1.2375,0.0499,10.7094,3.9417,12.2575,6.7237,4.0576,11.3042,1.6411,2.5176,0
1,1330.2,1314.2,784.4,-164.6,784.4,427.8439,531.2,363.0,7.1,356.7,154.4,356.7,1316.5,1363.3,27.4,-164.6,-12.1,3.8,43.5,6.7,-0.7,-71.0,54.1,624.0,15.3,1204.75,1344.2,1496.4,1282.6,27.4,253.2,222.8,624.0,1194.9,3.9,85.3,143.5,1319.8,1315.8,-205.8565,151.4126,-22.1561,-165.2,0.6,-58.9,-177.5,-28.1,-32.1,,589.8564,1.5181,0.51,-197.6666,268.7421,42.7933,,43.5,87.9778,91.1053,3.1275,-18.2051,-12.3741,0.0,0.0,775.1634,179.085,0.0,305.8824,-84.3137,-1075.817,1.1502,-13.3439,-12.3741,-2.4132,-13.2596,-47.2781,-44.4685,-8.6722,-10.1371,-24.9857,-23.5009,-19.9715,103.403,67.1498,1.1895,1.2312,1.2151,0.0661,7.1143,0.0,276.954,3.1779,18.1519,13.3854,2.0404,5.3674,0
2,1428.0,1423.1,365.3,6.2,365.3,193.9525,318.2,152.1,0.1,160.4,,160.4,1447.6,1450.2,2.4,6.2,11.9,3.1,1.0,33.9,9.4,7.5,117.6,40.1,14.3,1385.4,1416.1,1455.7,1423.1,2.4,47.1,18.7,40.1,1423.1,3.1,125.8,1.3,1426.3,1457.0,-143.8839,546.4505,-71.6666,6.2,0.0,9.3,9.3,7.0,8.6,0.0,7610.1604,3.5307,-5.4201,165.1407,-43.4826,-21.9672,0.0,1.0,99.4436,99.6222,0.1786,2.4194,0.4342,0.0,0.0,0.0,16.7832,0.0,18.1818,21.6783,43.3566,1.0014,0.6513,0.4342,0.6022,0.3155,2.6239,3.6152,5.0146,2.1555,1.2933,1.7819,1.1126,449.1552,50.4085,1.452,1.6642,0.7646,0.3173,15.4908,,81.7345,8.0175,1085.9231,185.2338,35.9369,77.5531,0
3,1125.8,1096.7,2048.2,183.3,2048.2,136.0677,1493.4,34.2,0.6,154.4,,154.4,814.1,816.6,26.7,153.2,284.8,20.5,0.2,,282.6,281.3,102.4,502.7,311.5,534.93,828.8,942.5,944.0,26.7,554.8,476.9,502.7,1096.7,27.9,866.6,97.5,1125.8,1096.7,362.0622,-89.3067,-36.3555,183.3,0.0,282.3,282.3,255.9,209.2,13.6388,229.9644,0.7087,0.5144,-37.7778,153.1566,-12.1414,13.6388,0.2,86.3767,86.6419,0.2653,10.0824,16.2818,0.0,0.0,0.0,8.5714,0.0,0.8026,31.7817,58.8443,27.6692,25.0755,16.2818,18.5823,16.2995,15.6343,15.6173,17.824,23.9669,15.6343,15.6173,11.5511,-426.6507,10.3388,2.278,2.4256,0.0,0.9916,213.7681,,,6.0911,10.5663,3.7328,2.6376,2.9331,0
4,87.4,86.9,154.0,-5.7,154.0,10.7811,20.4,19.5,0.1,19.6,,19.6,68.8,68.8,26.8,-5.7,-8.2,0.5,,,18.1,-8.2,91.6,253.8,18.6,91.54,95.6,93.1,86.9,26.8,133.6,46.3,253.8,86.9,0.5,-15.5,,87.4,86.9,-8.1316,-60.9009,3.2325,-5.7,0.0,-8.2,-8.2,-8.7,18.5,,187.689,0.5599,7.52,92.5546,12.3581,-4.8723,,,73.899,73.899,0.0,-16.4,-6.5217,0.0,0.0,0.0,144.086,0.0,0.0,-13.4409,-30.6452,21.2815,-9.3822,-6.5217,21.167,-6.5217,-4.7049,-4.7049,15.2703,-6.7685,-4.7049,-4.7049,-3.6515,-376.8116,96.0784,0.5658,0.5658,0.0,0.0084,1.1454,,,8.8673,3.5266,54.625,0.3425,1.4568,0
5,146.4,140.4,265.9,2.1,265.9,48.0659,221.6,102.4,0.1,96.9,,96.9,139.0,139.3,,2.1,3.1,6.0,,37.6,-2.9,2.8,110.5,0.2,3.1,136.8,139.0,140.0,140.2,,44.3,0.2,0.2,136.0,6.0,116.4,,146.4,136.1,3.1351,102.3833,30.2815,2.1,0.0,2.8,2.8,-2.9,2.8,0.0,70200.0,0.6737,2.7379,75.3927,2.3086,23.4094,0.0,,99.2857,99.5,0.2143,0.4667,1.4344,0.0,0.0,0.0,0.0,0.0,9.6774,22.5806,67.7419,2.1175,1.9126,1.4344,1.9126,1.4344,1.2923,1.2923,1.7231,1.7231,1.2923,1.2923,0.9664,2.6025,43.7274,0.96,2.1367,0.0,0.0078,2.1007,,,2.8919,2.7959,58.56,702.0,702.0,0
6,1615.7,1605.2,1941.9,107.2,1941.9,2164.6327,1641.7,1187.2,0.3,788.0,205.1,788.0,1112.7,1263.3,35.7,93.5,332.4,8.5,128.1,475.6,357.6,179.8,91.4,443.8,368.1,872.87,1280.0,1373.6,1605.0,35.7,300.2,286.6,443.8,1577.0,8.5,109.4,141.7,1615.7,1470.3,314.3433,34.2121,8.5447,107.2,0.0,181.8,159.1,321.9,168.3,10.6343,560.0837,0.8691,0.9612,9.5805,88.0267,2.8964,10.6343,128.1,81.0061,91.97,10.9639,21.1529,6.6349,0.0,0.0,6.1668,9.6985,0.0,40.9128,14.0994,29.1225,22.7827,9.8471,6.6349,10.4165,6.6349,22.174,22.174,34.8123,12.175,7.2589,7.2589,5.7667,26.4186,47.999,0.7007,1.0862,1.9358,0.0267,9.6668,,7.8109,2.3447,2.2887,5.2732,3.7952,5.6651,0
7,1724.2,1665.8,2424.3,123.7,2424.3,581.9771,905.7,173.5,5.6,314.2,1.1,314.2,1457.9,1467.3,71.2,123.7,204.2,2.6,3.6,265.0,217.4,182.9,215.8,1327.0,275.4,1107.02,1514.5,1610.0,1652.7,71.2,1518.6,668.7,1327.0,137.2,46.1,673.8,291.4,1718.3,1675.3,60.3884,13.2275,0.4841,123.7,0.0,194.8,190.0,146.2,196.4,0.0,249.1102,0.7099,0.8641,17.8509,81.4958,2.6535,0.0,3.6,90.5528,91.1366,0.5839,3.9675,7.1743,0.0,0.0,1.7429,25.8533,0.0,3.4132,24.0741,44.9165,15.9726,11.0196,7.1743,11.3908,6.8789,6.1385,6.4241,10.1997,9.1933,5.9412,6.2176,4.8665,117.8332,34.6914,3.0543,4.8481,0.0282,0.8909,22.7748,20.5036,41.1532,5.3212,10.8544,12.4695,1.2729,2.4309,0
8,61.2,55.2,84.8,-5.2,84.8,84.1312,54.9,53.1,0.2,19.6,5.1,19.6,44.3,49.8,1.6,-5.2,-0.6,1.0,4.4,21.3,-4.6,-10.5,22.4,23.1,1.0,43.83,61.4,50.9,55.0,1.6,29.9,13.8,23.1,39.9,1.2,-3.2,12.4,61.1,39.7,8.2914,-61.6895,-4.3019,-5.2,0.0,-6.1,-6.3,-6.2,-4.6,,400.0,0.5428,-7.8503,106.9143,-14.3699,7.2018,,4.4,87.0334,97.8389,10.8055,-8.75,-8.4967,0.0,0.0,20.0,160.0,0.0,550.0,-110.0,-520.0,1.634,-10.2941,-8.4967,-7.5163,-8.0196,-22.3744,-23.7443,-21.0046,-16.1043,-7.5153,-7.9755,-4.3459,139.9599,35.7013,0.4275,0.9397,2.1813,0.0452,79.658,,1.5088,1.4136,0.4841,3.0099,2.3691,2.8716,0
9,18.4,0.2,108.6,12.3,108.6,732.875,106.5,66.3,0.9,44.1,4.6,44.1,5.0,5.5,0.5,12.3,12.9,0.3,0.1,36.9,-4.8,12.4,40.0,2.7,13.4,2.14,5.5,6.1,0.2,0.5,2.1,2.1,2.7,0.2,18.2,40.2,1.1,18.4,0.2,106.4068,-170.8769,-99.6299,12.3,0.0,12.4,12.4,-5.3,12.8,0.0,9.5238,0.2627,-6.3605,104.1297,-64.8426,60.0734,0.0,0.1,81.9672,90.1639,8.1967,0.6813,66.8478,0.0,0.0,0.0,3.7313,0.0,3.7313,0.7463,91.791,72.8261,67.3913,66.8478,69.5652,66.8478,35.0927,35.0927,36.5193,31.5924,31.3376,31.3376,17.5589,1014.144,41.4085,0.6848,1.6063,0.1699,0.0151,66.3636,,,0.0075,0.0133,12.2667,0.1429,0.1818,0


In [6]:
df['sa_gross_profit'] = df['sa_total_income'] - df['sa_total_expense']
df['X1'] = df['sa_pat']/df['sa_total_assets']
df['X2'] = df['sa_total_liabilities']/df['sa_total_assets']
df['X3'] = df['sa_gross_working_capital_cosm']/df['sa_total_assets']
df['X4'] = df['sa_current_assets_incl_st_invest_loans']/df['sa_current_liabilities']
df['X6'] = df['sa_retained_profits']/df['sa_total_assets']
df['X7'] = df['sa_pbit']/df['sa_total_assets']
df['X9'] = df['sa_sales']/df['sa_total_assets']
df['X12'] = df['sa_gross_profit'] / df['sa_current_liabilities']
df['X13'] = (df['sa_gross_profit'] + df['sa_depreciation'])/df['sa_sales']
df['X13'] = (df['sa_gross_profit'] + df['sa_depreciation'])/df['sa_sales']
df['X14'] = df['sa_gross_profit'] +df['sa_interest_inc']/df['sa_total_assets']
df['X15'] = (df['sa_total_liabilities']*365)/(df['sa_gross_profit'] +df['sa_depreciation'])
df['X16'] = (df['sa_gross_profit'] +df['sa_depreciation'])/df['sa_total_liabilities']
df['X17'] = df['sa_gross_profit']/df['sa_total_liabilities']

In [7]:
df['X18'] = df['sa_gross_profit']/df['sa_total_assets']
df['X19'] = df['sa_gross_profit']/df['sa_sales']
df['X20'] = (df['sa_st_inventories']*365)/df['sa_sales']
df['X23'] = df['sa_pat']/df['sa_sales']
df['X26'] = (df['sa_pat'] + df['sa_depreciation'])/ df['sa_total_liabilities']
df['X28'] = df['sa_gross_working_capital_cosm']/df['sa_gross_fixed_assets'] 
df['X29'] = np.log(df['sa_total_assets'])
df['X30'] = (df['sa_total_liabilities'] - df['sa_cash_bal'])/df['sa_sales']
df['X31'] = (df['sa_gross_profit'] + df['sa_interest_inc'])/df['sa_sales']
df['X32'] = (df['sa_current_liabilities'] *365)/df['sa_cost_of_goods_sold']
df['X33'] = (df['sa_nf_operating_expenses']+df['sa_f_operating_expenses'])/df['sa_current_liabilities']
df['X34'] = (df['sa_nf_operating_expenses']+df['sa_f_operating_expenses'])/df['sa_total_liabilities']
df['X35'] = df['sa_pbt']/df['sa_total_assets']
df['X36'] = df['sa_sales'] /df['sa_total_assets']
df['X37'] = (df['sa_current_assets_incl_st_invest_loans'] - df['sa_st_inventories'])/ \
(df['sa_total_liabilities']-df['sa_current_liabilities'])
df['X38'] = df['sa_total_capital'] /df['sa_total_assets']
df['X40'] = (df['sa_current_ratio'] - df['sa_st_inventories'] - df['sa_st_trade_receivables'])/df['sa_current_liabilities']
df['X44'] = df['sa_st_trade_receivables']*365/df['sa_sales']
df['X45'] = df['sa_pat']/df['sa_st_inventories']
df['X46'] = (df['sa_current_liabilities'] - df['sa_st_inventories'])/df['sa_current_liabilities']
df['X47'] = (df['sa_st_inventories']*365)/df['sa_cost_of_goods_sold']
df['X48'] =  df['sa_pbdita']/df['sa_total_assets']
df['X49'] = df['sa_pbdita']/df['sa_sales']
df['X50'] = df['sa_current_assets_incl_st_invest_loans']/df['sa_total_liabilities']
df['X51'] = df['sa_current_liabilities']/df['sa_total_assets']
df['X52'] = (df['sa_current_liabilities'] * 365)/df['sa_cost_of_goods_sold']
df['X54'] = df['sa_total_capital']/df['sa_gross_fixed_assets']
df['X56'] = (df['sa_sales'] - df['sa_cost_of_goods_sold'])/df['sa_sales']
df['X58'] = df['sa_total_expense']/df['sa_sales']
df['X60'] = df['sa_sales']/df['sa_st_inventories']
df['X61'] = df['sa_sales']/df['sa_st_trade_receivables']
df['X62'] = (df['sa_current_liabilities'] *365)/df['sa_sales']
df['X63'] =df['sa_sales']/df['sa_current_liabilities']
df['X64'] =df['sa_sales']/df['sa_gross_fixed_assets']

In [8]:
df.head(30)

Unnamed: 0,sa_total_income,sa_sales,sa_total_assets,sa_pat,sa_total_liabilities,sa_gross_working_capital_cosm,sa_current_assets_incl_st_invest_loans,sa_current_liabilities,sa_cash_bal,sa_st_trade_bills_receivables,sa_debtors_more_6m,sa_st_trade_receivables,sa_nf_operating_expenses,sa_f_operating_expenses,sa_dep_owned_ast,sa_retained_profits,sa_pbit,sa_interest_inc,sa_interest_exp,sa_st_inventories,sa_pbdita_net_of_peoifi,sa_pbpt_net_of_peoi,sa_total_capital,sa_gross_fixed_assets,sa_pbdita,sa_cost_of_goods_sold,sa_cost_of_sales,sa_total_expense,sa_net_sales,sa_depreciation,sa_non_current_assets,sa_net_fixed_assets,sa_gross_fixed_assets.1,sa_non_fin_services_inc,sa_inc_fin_serv,sa_net_working_capital,sa_non_current_liabilities,sa_tot_inc_net_of_pe,sa_sales_n_chg_in_stk,sa_chg_in_assets_with_no_chg_in_efficiency,sa_chg_in_efficiency_with_no_chg_in_assets,sa_chg_in_efficiency_on_chg_in_assets,sa_reported_pat,sa_diff_in_pat,sa_pbpt,sa_pbt,sa_pbit_net_of_peoifi,sa_cash_profit,sa_equity_div_inc_dist_pc_pat,sa_sales_net_fixed_assets,sa_total_income_avg_tot_asset_net_miscexp_now_reval,sa_chg_in_efficiency_in_use_of_assets,sa_pc_chg_in_efficiency_with_no_chg_in_assets,sa_pc_chg_in_assets_with_no_chg_in_efficiency,sa_pc_chg_in_efficiency_on_chg_in_assets,sa_total_div_pc_pat,sa_total_interest_exp,sa_nf_oper_exp_pc_total_exp,sa_f_oper_exp_pc_total_exp,sa_fin_serv_exp_pc_total_exp,sa_pbpt_net_of_peoi_inc_fin_serv,sa_pat_cont_ops_pc_inc_cont_ops,sa_pat_discont_ops_pc_inc_discont_ops,sa_total_provisions_pc_pbdita,sa_write_offs_pc_pbdita,sa_depreciation_pc_pbdita,sa_amortisation_pc_pbdita,sa_fin_serv_exp_pc_pbdita,sa_prov_direct_tax_pc_pbdita,sa_pat_pc_pbdita,sa_pbdita_pc_total_inc,sa_pbt_pc_total_inc,sa_pat_pc_total_inc,sa_cash_profit_pc_total_inc,sa_pat_net_of_pe_pc_tot_inc_net_of_pe,sa_pat_net_of_pe_pc_avg_networth,sa_pat_pc_avg_networth,sa_cash_profit_pc_avg_networth,sa_pbpt_net_of_peoi_pc_avg_capital_employed,sa_pat_net_of_pe_pc_avg_capital_employed,sa_pat_pc_avg_capital_employed,sa_pat_net_of_pe_pc_avg_tot_asset_net_menow_reval,sa_pc_chg_in_profitability_with_no_chg_in_income,sa_st_trade_bills_receivables_pc_current_assets_incl_st_invest_loans,sa_quick_ratio,sa_current_ratio,sa_debt_equity,sa_cash_n_bank_no_fd_security_current_liab_n_prov,sa_cash_n_bank_no_fd_security_cost_of_sales_per_day,sa_rawmat_stores_spares_avg_stk_rawmat_stores,sa_cost_of_goods_sold_avg_stk_fg,sa_sales_avg_debtors,sa_creditors_turnover,sa_total_inc_net_of_pe_compensation_to_empl,sa_sales_avg_gfa_net_of_reval,sa_sales_net_repairs_avg_nfa_net_of_reval,delisted,sa_gross_profit,X1,X2,X3,X4,X6,X7,X9,X12,X13,X14,X15,X16,X17,X18,X19,X20,X23,X26,X28,X29,X30,X31,X32,X33,X34,X35,X36,X37,X38,X40,X44,X45,X46,X47,X48,X49,X50,X51,X52,X54,X56,X58,X60,X61,X62,X63,X64
0,3741.8,3729.3,3661.4,131.6,3661.4,1606.7038,1557.9,1399.7,1.6,548.6,,548.6,3177.5,3405.7,89.8,131.6,429.8,5.6,216.8,591.7,509.0,196.6,176.4,2384.5,519.6,2360.19,3319.6,3567.4,3569.9,89.8,2103.5,1560.3,2384.5,18.5,5.6,-40.0,901.1,3738.3,3686.5,198.5575,14.809,0.8336,131.6,0.0,201.6,193.2,419.2,247.7,0.0,239.0117,1.0683,1.1476,6.9136,92.6972,1.2432,0.0,216.8,89.0705,95.4673,6.3968,35.1071,3.517,0.0,1.5012,0.1155,17.2825,0.0,43.9184,11.8553,25.3272,13.8864,5.1633,3.517,6.6198,3.4775,12.9039,13.0627,24.5868,7.8308,5.178,5.2418,3.7114,75.0796,35.2141,0.517,0.9745,1.2375,0.0499,10.7094,3.9417,12.2575,6.7237,4.0576,11.3042,1.6411,2.5176,0,174.4,0.035943,1.0,0.438822,1.113024,0.035943,0.117387,1.018545,0.124598,0.070844,174.401529,5058.33081,0.072158,0.047632,0.047632,0.046765,57.911807,0.035288,0.060469,0.673812,8.205601,0.981364,0.048266,216.461598,4.703294,1.798001,0.052767,1.018545,0.427201,0.048178,-0.813978,53.693455,0.22241,0.577267,91.505557,0.141913,0.139329,0.425493,0.382285,216.461598,0.073978,0.367123,0.956587,6.302687,6.797849,136.993672,2.664357,1.563976
1,1330.2,1314.2,784.4,-164.6,784.4,427.8439,531.2,363.0,7.1,356.7,154.4,356.7,1316.5,1363.3,27.4,-164.6,-12.1,3.8,43.5,6.7,-0.7,-71.0,54.1,624.0,15.3,1204.75,1344.2,1496.4,1282.6,27.4,253.2,222.8,624.0,1194.9,3.9,85.3,143.5,1319.8,1315.8,-205.8565,151.4126,-22.1561,-165.2,0.6,-58.9,-177.5,-28.1,-32.1,,589.8564,1.5181,0.51,-197.6666,268.7421,42.7933,,43.5,87.9778,91.1053,3.1275,-18.2051,-12.3741,0.0,0.0,775.1634,179.085,0.0,305.8824,-84.3137,-1075.817,1.1502,-13.3439,-12.3741,-2.4132,-13.2596,-47.2781,-44.4685,-8.6722,-10.1371,-24.9857,-23.5009,-19.9715,103.403,67.1498,1.1895,1.2312,1.2151,0.0661,7.1143,0.0,276.954,3.1779,18.1519,13.3854,2.0404,5.3674,0,-166.2,-0.209842,1.0,0.545441,1.463361,-0.209842,-0.015426,1.675421,-0.457851,-0.105616,-166.195156,-2062.723343,-0.176951,-0.211882,-0.211882,-0.126465,1.860828,-0.125247,-0.174911,0.685647,6.664919,0.591462,-0.123573,109.977174,7.382369,3.416369,-0.226288,1.675421,1.244661,0.06897,-0.99771,99.068254,-24.567164,0.981543,2.029882,0.019505,0.011642,0.677206,0.462774,109.977174,0.086699,0.083283,1.138639,196.149254,3.684329,100.817988,3.620386,2.10609
2,1428.0,1423.1,365.3,6.2,365.3,193.9525,318.2,152.1,0.1,160.4,,160.4,1447.6,1450.2,2.4,6.2,11.9,3.1,1.0,33.9,9.4,7.5,117.6,40.1,14.3,1385.4,1416.1,1455.7,1423.1,2.4,47.1,18.7,40.1,1423.1,3.1,125.8,1.3,1426.3,1457.0,-143.8839,546.4505,-71.6666,6.2,0.0,9.3,9.3,7.0,8.6,0.0,7610.1604,3.5307,-5.4201,165.1407,-43.4826,-21.9672,0.0,1.0,99.4436,99.6222,0.1786,2.4194,0.4342,0.0,0.0,0.0,16.7832,0.0,18.1818,21.6783,43.3566,1.0014,0.6513,0.4342,0.6022,0.3155,2.6239,3.6152,5.0146,2.1555,1.2933,1.7819,1.1126,449.1552,50.4085,1.452,1.6642,0.7646,0.3173,15.4908,,81.7345,8.0175,1085.9231,185.2338,35.9369,77.5531,0,-27.7,0.016972,1.0,0.53094,2.092045,0.016972,0.032576,3.895702,-0.182117,-0.017778,-27.691514,-5270.13834,-0.069258,-0.075828,-0.075828,-0.019465,8.694751,0.004357,0.023542,4.836721,5.900719,0.256623,-0.017286,40.072542,19.05194,7.932658,0.025459,3.895702,1.33349,0.321927,-1.266508,41.139765,0.182891,0.77712,8.931356,0.039146,0.010048,0.871065,0.41637,40.072542,2.932668,0.026491,1.022908,41.979351,8.872195,39.010962,9.356345,35.488778
3,1125.8,1096.7,2048.2,183.3,2048.2,136.0677,1493.4,34.2,0.6,154.4,,154.4,814.1,816.6,26.7,153.2,284.8,20.5,0.2,,282.6,281.3,102.4,502.7,311.5,534.93,828.8,942.5,944.0,26.7,554.8,476.9,502.7,1096.7,27.9,866.6,97.5,1125.8,1096.7,362.0622,-89.3067,-36.3555,183.3,0.0,282.3,282.3,255.9,209.2,13.6388,229.9644,0.7087,0.5144,-37.7778,153.1566,-12.1414,13.6388,0.2,86.3767,86.6419,0.2653,10.0824,16.2818,0.0,0.0,0.0,8.5714,0.0,0.8026,31.7817,58.8443,27.6692,25.0755,16.2818,18.5823,16.2995,15.6343,15.6173,17.824,23.9669,15.6343,15.6173,11.5511,-426.6507,10.3388,2.278,2.4256,0.0,0.9916,213.7681,,,6.0911,10.5663,3.7328,2.6376,2.9331,0,183.3,0.089493,1.0,0.066433,43.666667,0.074797,0.139049,0.535446,5.359649,0.191484,183.310009,3559.966667,0.102529,0.089493,0.089493,0.167138,,0.167138,0.102529,0.270674,7.624717,1.867056,0.18583,23.335764,47.681287,0.796162,0.137828,0.535446,,0.049995,,51.386888,,,,0.152085,0.284034,0.729128,0.016698,23.335764,0.2037,0.512237,0.859396,,7.102979,11.382329,32.067251,2.181619
4,87.4,86.9,154.0,-5.7,154.0,10.7811,20.4,19.5,0.1,19.6,,19.6,68.8,68.8,26.8,-5.7,-8.2,0.5,,,18.1,-8.2,91.6,253.8,18.6,91.54,95.6,93.1,86.9,26.8,133.6,46.3,253.8,86.9,0.5,-15.5,,87.4,86.9,-8.1316,-60.9009,3.2325,-5.7,0.0,-8.2,-8.2,-8.7,18.5,,187.689,0.5599,7.52,92.5546,12.3581,-4.8723,,,73.899,73.899,0.0,-16.4,-6.5217,0.0,0.0,0.0,144.086,0.0,0.0,-13.4409,-30.6452,21.2815,-9.3822,-6.5217,21.167,-6.5217,-4.7049,-4.7049,15.2703,-6.7685,-4.7049,-4.7049,-3.6515,-376.8116,96.0784,0.5658,0.5658,0.0,0.0084,1.1454,,,8.8673,3.5266,54.625,0.3425,1.4568,0,-5.7,-0.037013,1.0,0.070007,1.046154,-0.037013,-0.053247,0.564286,-0.292308,0.242808,-5.696753,2663.981043,0.137013,-0.037013,-0.037013,-0.065593,,-0.065593,0.137013,0.042479,5.036953,1.771001,-0.059839,77.752895,7.05641,0.893506,-0.053247,0.564286,,0.594805,,82.324511,,,,0.120779,0.214039,0.132468,0.126623,77.752895,0.360914,-0.053395,1.071346,,4.433673,81.904488,4.45641,0.342396
5,146.4,140.4,265.9,2.1,265.9,48.0659,221.6,102.4,0.1,96.9,,96.9,139.0,139.3,,2.1,3.1,6.0,,37.6,-2.9,2.8,110.5,0.2,3.1,136.8,139.0,140.0,140.2,,44.3,0.2,0.2,136.0,6.0,116.4,,146.4,136.1,3.1351,102.3833,30.2815,2.1,0.0,2.8,2.8,-2.9,2.8,0.0,70200.0,0.6737,2.7379,75.3927,2.3086,23.4094,0.0,,99.2857,99.5,0.2143,0.4667,1.4344,0.0,0.0,0.0,0.0,0.0,9.6774,22.5806,67.7419,2.1175,1.9126,1.4344,1.9126,1.4344,1.2923,1.2923,1.7231,1.7231,1.2923,1.2923,0.9664,2.6025,43.7274,0.96,2.1367,0.0,0.0078,2.1007,,,2.8919,2.7959,58.56,702.0,702.0,0,6.4,0.007898,1.0,0.180767,2.164062,0.007898,0.011659,0.528018,0.0625,,6.422565,,,0.024069,0.024069,0.045584,97.749288,0.014957,,240.3295,5.58312,1.893162,0.088319,273.216374,2.717773,1.046634,0.01053,0.528018,1.125382,0.41557,-1.29261,251.912393,0.055851,0.632813,100.321637,0.011659,0.02208,0.833396,0.385107,273.216374,552.5,0.025641,0.997151,3.734043,1.448916,266.210826,1.371094,702.0
6,1615.7,1605.2,1941.9,107.2,1941.9,2164.6327,1641.7,1187.2,0.3,788.0,205.1,788.0,1112.7,1263.3,35.7,93.5,332.4,8.5,128.1,475.6,357.6,179.8,91.4,443.8,368.1,872.87,1280.0,1373.6,1605.0,35.7,300.2,286.6,443.8,1577.0,8.5,109.4,141.7,1615.7,1470.3,314.3433,34.2121,8.5447,107.2,0.0,181.8,159.1,321.9,168.3,10.6343,560.0837,0.8691,0.9612,9.5805,88.0267,2.8964,10.6343,128.1,81.0061,91.97,10.9639,21.1529,6.6349,0.0,0.0,6.1668,9.6985,0.0,40.9128,14.0994,29.1225,22.7827,9.8471,6.6349,10.4165,6.6349,22.174,22.174,34.8123,12.175,7.2589,7.2589,5.7667,26.4186,47.999,0.7007,1.0862,1.9358,0.0267,9.6668,,7.8109,2.3447,2.2887,5.2732,3.7952,5.6651,0,242.1,0.055204,1.0,1.114698,1.382834,0.048149,0.171173,0.826613,0.203925,0.173063,242.104377,2551.452484,0.143056,0.124672,0.124672,0.150822,108.144779,0.066783,0.073588,4.877496,7.571422,1.209569,0.156118,496.440478,2.001348,1.223544,0.08193,0.826613,1.545117,0.047067,-1.063438,179.180164,0.225399,0.599394,198.877267,0.189557,0.229317,0.845409,0.61136,496.440478,0.205949,0.456224,0.855719,3.375105,2.037056,269.952654,1.352089,3.616945
7,1724.2,1665.8,2424.3,123.7,2424.3,581.9771,905.7,173.5,5.6,314.2,1.1,314.2,1457.9,1467.3,71.2,123.7,204.2,2.6,3.6,265.0,217.4,182.9,215.8,1327.0,275.4,1107.02,1514.5,1610.0,1652.7,71.2,1518.6,668.7,1327.0,137.2,46.1,673.8,291.4,1718.3,1675.3,60.3884,13.2275,0.4841,123.7,0.0,194.8,190.0,146.2,196.4,0.0,249.1102,0.7099,0.8641,17.8509,81.4958,2.6535,0.0,3.6,90.5528,91.1366,0.5839,3.9675,7.1743,0.0,0.0,1.7429,25.8533,0.0,3.4132,24.0741,44.9165,15.9726,11.0196,7.1743,11.3908,6.8789,6.1385,6.4241,10.1997,9.1933,5.9412,6.2176,4.8665,117.8332,34.6914,3.0543,4.8481,0.0282,0.8909,22.7748,20.5036,41.1532,5.3212,10.8544,12.4695,1.2729,2.4309,0,114.2,0.051025,1.0,0.24006,5.220173,0.051025,0.08423,0.687126,0.658213,0.111298,114.201072,4772.7589,0.076476,0.047106,0.047106,0.068556,58.065194,0.074259,0.080394,0.438566,7.793298,1.451975,0.070116,57.20538,16.859942,1.206616,0.078373,0.687126,0.284654,0.089015,-3.310386,68.8456,0.466792,-0.527378,87.374212,0.1136,0.165326,0.373592,0.071567,57.20538,0.162622,0.335442,0.966503,6.286038,5.301719,38.016268,9.601153,1.255313
8,61.2,55.2,84.8,-5.2,84.8,84.1312,54.9,53.1,0.2,19.6,5.1,19.6,44.3,49.8,1.6,-5.2,-0.6,1.0,4.4,21.3,-4.6,-10.5,22.4,23.1,1.0,43.83,61.4,50.9,55.0,1.6,29.9,13.8,23.1,39.9,1.2,-3.2,12.4,61.1,39.7,8.2914,-61.6895,-4.3019,-5.2,0.0,-6.1,-6.3,-6.2,-4.6,,400.0,0.5428,-7.8503,106.9143,-14.3699,7.2018,,4.4,87.0334,97.8389,10.8055,-8.75,-8.4967,0.0,0.0,20.0,160.0,0.0,550.0,-110.0,-520.0,1.634,-10.2941,-8.4967,-7.5163,-8.0196,-22.3744,-23.7443,-21.0046,-16.1043,-7.5153,-7.9755,-4.3459,139.9599,35.7013,0.4275,0.9397,2.1813,0.0452,79.658,,1.5088,1.4136,0.4841,3.0099,2.3691,2.8716,0,10.3,-0.061321,1.0,0.992113,1.033898,-0.061321,-0.007075,0.650943,0.193974,0.21558,10.311792,2601.008403,0.14033,0.121462,0.121462,0.186594,140.842391,-0.094203,-0.042453,3.642043,4.440296,1.532609,0.20471,442.197125,1.772128,1.10967,-0.074292,0.650943,1.059937,0.264151,-0.752548,129.601449,-0.244131,0.59887,177.378508,0.011792,0.018116,0.647406,0.626179,442.197125,0.969697,0.205978,0.922101,2.591549,2.816327,351.11413,1.039548,2.38961
9,18.4,0.2,108.6,12.3,108.6,732.875,106.5,66.3,0.9,44.1,4.6,44.1,5.0,5.5,0.5,12.3,12.9,0.3,0.1,36.9,-4.8,12.4,40.0,2.7,13.4,2.14,5.5,6.1,0.2,0.5,2.1,2.1,2.7,0.2,18.2,40.2,1.1,18.4,0.2,106.4068,-170.8769,-99.6299,12.3,0.0,12.4,12.4,-5.3,12.8,0.0,9.5238,0.2627,-6.3605,104.1297,-64.8426,60.0734,0.0,0.1,81.9672,90.1639,8.1967,0.6813,66.8478,0.0,0.0,0.0,3.7313,0.0,3.7313,0.7463,91.791,72.8261,67.3913,66.8478,69.5652,66.8478,35.0927,35.0927,36.5193,31.5924,31.3376,31.3376,17.5589,1014.144,41.4085,0.6848,1.6063,0.1699,0.0151,66.3636,,,0.0075,0.0133,12.2667,0.1429,0.1818,0,12.3,0.11326,1.0,6.748389,1.606335,0.11326,0.118785,0.001842,0.18552,64.0,12.302762,3096.796875,0.117864,0.11326,0.11326,61.5,67342.5,61.5,0.117864,271.435185,4.687671,538.5,63.0,11308.17757,0.158371,0.096685,0.11418,0.001842,1.64539,0.368324,-1.197492,80482.5,0.333333,0.443439,6293.691589,0.123389,67.0,0.980663,0.610497,11308.17757,14.814815,-9.7,30.5,0.00542,0.004535,120997.5,0.003017,0.074074


In [9]:
df.shape

(4770, 145)

In [10]:
df.describe()

Unnamed: 0,sa_total_income,sa_sales,sa_total_assets,sa_pat,sa_total_liabilities,sa_gross_working_capital_cosm,sa_current_assets_incl_st_invest_loans,sa_current_liabilities,sa_cash_bal,sa_st_trade_bills_receivables,sa_debtors_more_6m,sa_st_trade_receivables,sa_nf_operating_expenses,sa_f_operating_expenses,sa_dep_owned_ast,sa_retained_profits,sa_pbit,sa_interest_inc,sa_interest_exp,sa_st_inventories,sa_pbdita_net_of_peoifi,sa_pbpt_net_of_peoi,sa_total_capital,sa_gross_fixed_assets,sa_pbdita,sa_cost_of_goods_sold,sa_cost_of_sales,sa_total_expense,sa_net_sales,sa_depreciation,sa_non_current_assets,sa_net_fixed_assets,sa_gross_fixed_assets.1,sa_non_fin_services_inc,sa_inc_fin_serv,sa_net_working_capital,sa_non_current_liabilities,sa_tot_inc_net_of_pe,sa_sales_n_chg_in_stk,sa_chg_in_assets_with_no_chg_in_efficiency,sa_chg_in_efficiency_with_no_chg_in_assets,sa_chg_in_efficiency_on_chg_in_assets,sa_reported_pat,sa_diff_in_pat,sa_pbpt,sa_pbt,sa_pbit_net_of_peoifi,sa_cash_profit,sa_equity_div_inc_dist_pc_pat,sa_sales_net_fixed_assets,sa_total_income_avg_tot_asset_net_miscexp_now_reval,sa_chg_in_efficiency_in_use_of_assets,sa_pc_chg_in_efficiency_with_no_chg_in_assets,sa_pc_chg_in_assets_with_no_chg_in_efficiency,sa_pc_chg_in_efficiency_on_chg_in_assets,sa_total_div_pc_pat,sa_total_interest_exp,sa_nf_oper_exp_pc_total_exp,sa_f_oper_exp_pc_total_exp,sa_fin_serv_exp_pc_total_exp,sa_pbpt_net_of_peoi_inc_fin_serv,sa_pat_cont_ops_pc_inc_cont_ops,sa_pat_discont_ops_pc_inc_discont_ops,sa_total_provisions_pc_pbdita,sa_write_offs_pc_pbdita,sa_depreciation_pc_pbdita,sa_amortisation_pc_pbdita,sa_fin_serv_exp_pc_pbdita,sa_prov_direct_tax_pc_pbdita,sa_pat_pc_pbdita,sa_pbdita_pc_total_inc,sa_pbt_pc_total_inc,sa_pat_pc_total_inc,sa_cash_profit_pc_total_inc,sa_pat_net_of_pe_pc_tot_inc_net_of_pe,sa_pat_net_of_pe_pc_avg_networth,sa_pat_pc_avg_networth,sa_cash_profit_pc_avg_networth,sa_pbpt_net_of_peoi_pc_avg_capital_employed,sa_pat_net_of_pe_pc_avg_capital_employed,sa_pat_pc_avg_capital_employed,sa_pat_net_of_pe_pc_avg_tot_asset_net_menow_reval,sa_pc_chg_in_profitability_with_no_chg_in_income,sa_st_trade_bills_receivables_pc_current_assets_incl_st_invest_loans,sa_quick_ratio,sa_current_ratio,sa_debt_equity,sa_cash_n_bank_no_fd_security_current_liab_n_prov,sa_cash_n_bank_no_fd_security_cost_of_sales_per_day,sa_rawmat_stores_spares_avg_stk_rawmat_stores,sa_cost_of_goods_sold_avg_stk_fg,sa_sales_avg_debtors,sa_creditors_turnover,sa_total_inc_net_of_pe_compensation_to_empl,sa_sales_avg_gfa_net_of_reval,sa_sales_net_repairs_avg_nfa_net_of_reval,delisted,sa_gross_profit,X1,X2,X3,X4,X6,X7,X9,X12,X13,X14,X15,X16,X17,X18,X19,X20,X23,X26,X28,X29,X30,X31,X32,X33,X34,X35,X36,X37,X38,X40,X44,X45,X46,X47,X48,X49,X50,X51,X52,X54,X56,X58,X60,X61,X62,X63,X64
count,4558.0,3847.0,4765.0,4748.0,4769.0,4770.0,4686.0,4622.0,3634.0,3927.0,2454.0,3926.0,4748.0,4748.0,3870.0,4748.0,4748.0,3718.0,3380.0,3348.0,4748.0,4748.0,4764.0,4270.0,4748.0,4770.0,4734.0,4748.0,4021.0,3866.0,4637.0,4298.0,4270.0,2802.0,3948.0,4766.0,3987.0,4558.0,3889.0,4662.0,4662.0,4662.0,4682.0,4748.0,4748.0,4748.0,4748.0,4748.0,3208.0,4412.0,4749.0,4616.0,4475.0,4475.0,4475.0,3208.0,3381.0,4769.0,4769.0,4769.0,3948.0,4577.0,4755.0,4694.0,4694.0,4716.0,4716.0,4716.0,4716.0,4716.0,4580.0,4580.0,4580.0,4580.0,4545.0,4211.0,4211.0,4211.0,4594.0,4594.0,4594.0,4749.0,4313.0,4770.0,4677.0,4677.0,4202.0,4677.0,4731.0,2389.0,2496.0,4069.0,4112.0,4511.0,4324.0,4187.0,4770.0,4558.0,4745.0,4764.0,4764.0,4543.0,4745.0,4745.0,3847.0,4435.0,3469.0,3718.0,3826.0,3826.0,4558.0,4557.0,3847.0,3067.0,3847.0,3866.0,4270.0,4764.0,3144.0,3173.0,4622.0,4607.0,4748.0,4745.0,3847.0,3314.0,4760.0,3113.0,3562.0,3346.0,3314.0,3348.0,4745.0,3847.0,4686.0,4618.0,4622.0,4267.0,3847.0,3847.0,3067.0,3562.0,3786.0,3786.0,3641.0
mean,14560.05,13134.03,48026.59,821.910573,47986.31,13680.7,6950.264,7075.376,185.190451,1750.664961,376.272657,1744.73892,9732.61,11756.21,547.124367,426.176769,3764.759,3202.353,2696.201,2163.843578,1008.672641,1607.02976,679.011062,8718.369,4210.232,7709.091,10192.53,13257.45,11458.29,543.217563,14197.57,6201.619,8718.369,3037.192291,3688.992,2003.017,7468.468,14372.07,13116.65,1336.838939,-533.852508,-103.901618,833.414716,0.080813,1741.162511,1169.875864,563.199663,1722.125695,10.863964,3452.441,0.801036,1.09736,44.182752,158.369793,-2.67338,10.995695,2751.236,75.444923,86.905399,11.460477,-18.262312,-435.9708,-5.011796,371.224,-2.928142,70.645757,0.175411,733.221,-999.3859,-71.700478,-58.309293,-443.2165,-443.4199,-271.904788,-628.3063,-13.354656,-10.50308,3.129449,0.265408,-3.089982,-0.785409,-5.378135,-318.9223,29.817643,7.104117,15.945312,1.687443,4.378708,370.899971,13.101025,145.507223,26.997859,25.146824,37.400743,30.94896,39.56158,0.099581,750.806406,-inf,1.0,1.019671,26.225871,-inf,-inf,0.856938,1.962951,10.591276,929.347929,inf,-0.013844,-inf,-0.080422,8.022579,48068.27,8.09366,-0.017958,24.478803,-inf,656.4604,94.848735,inf,12.468867,inf,-inf,0.856938,0.67864,inf,16.701067,2513.23,1.368331,-4.347788,inf,-inf,68.518591,0.51854,inf,inf,42.710004,-5.343211,71.97413,61.337251,25.723667,97496.33,6.506462,30.304098
std,112292.4,110800.9,523618.3,9792.039665,523400.4,358490.2,40727.99,48852.58,2855.562575,8561.556954,3919.748256,8548.533155,91653.01,97346.73,4420.194534,7270.460805,35933.9,39336.65,26913.28,15331.824441,16338.800193,15392.488957,3620.387527,76160.02,37469.5,70308.8,92342.79,105605.8,92714.04,4414.565557,124350.1,53590.5,76160.02,28488.95763,44809.44,58205.59,67704.15,111686.9,112662.5,13869.489605,8318.226826,1881.039795,9856.496043,157.680992,16476.973407,12852.821041,13923.100817,15614.708489,77.357341,42133.78,1.289885,33.565978,939.904515,6819.019289,386.29581,77.385649,26971.31,28.059734,21.250018,19.244502,532.639947,17818.01,199.405802,24265.65,467.884786,5293.12708,36.816397,49971.35,69956.32,9678.448057,1684.230263,17823.71,17819.49,8909.276325,20279.72,628.121158,616.170909,355.790844,73.813099,78.374472,90.233435,146.097294,26967.97,27.062082,74.556903,141.216442,13.239338,65.617848,2620.77392,44.041993,1838.263207,444.092839,616.021871,199.877845,482.757661,489.694085,0.299472,9216.191019,,0.0,15.304503,225.907245,,,1.013714,41.926212,460.108676,10190.451679,,1.398582,,2.904731,435.51663,2561047.0,435.511066,1.415477,411.613635,,21557.81,3279.769212,,89.987573,,,1.013714,2.729486,,518.745977,43161.1,99.516275,63.189885,,,2435.469215,0.311188,,,372.085653,145.80899,2353.807685,679.723845,348.769426,2971770.0,47.555088,377.488718
min,-1.3,-1.5,-35.7,-99256.0,-35.7,0.0,0.1,0.1,0.1,0.1,0.0,0.1,-294.3,-196.4,0.0,-104712.0,-29122.9,0.1,0.0,0.1,-441797.1,-52287.0,0.1,0.1,-28961.6,-425.27,-416.1,-181.2,-680.4,0.1,-52.0,-61.0,0.1,-1.5,0.1,-1257216.0,0.0,-1.3,-1326.8,-84468.1787,-250553.9202,-73650.4141,-99256.0,-8006.0,-74028.0,-86180.1,-464730.2,-48046.3,-0.0947,0.0,-5.0929,-642.0,-25622.7702,-25705.971,-10883.4185,-0.0947,0.1,-400.0,-400.0,-54.0287,-20553.0,-1189500.0,-12100.0,-4033.505,-19025.0,-34000.0,-2000.0,-33525.0,-4803450.0,-647700.0,-101700.0,-1189500.0,-1189500.0,-574300.0,-1155200.0,-40020.0,-39320.0,-22180.0,-3440.0,-3440.0,-3440.0,-8733.3333,-1751650.0,0.0,-24.5294,-0.6268,0.0,-25.5294,-260.7143,-15.0,-1.9629,-0.0815,-0.0565,-3.25,-180.9806,-44.0,0.0,-99256.0,-inf,1.0,0.0,0.000249,-inf,-inf,-0.014837,-595.0,-5720.0,-99255.999144,-5.365408e+20,-61.0,-inf,-174.0,-6886.0,-730.0,-6886.0,-61.0,0.0,-inf,-67.33333,-4012.5,-2986.363636,-10.760965,-0.170098,-inf,-0.014837,-94.0,-1.40056,-302.333,-4209.667,-2545.025641,-2475.0,-14434.09,-inf,-360.8,-0.081232,7.7e-05,-2986.363636,0.000128,-8281.342857,-41.666667,-0.5,-0.086705,-1971.0,-0.185185,2.5e-05
25%,30.7,59.95,133.3,-0.7,132.4,1.201775,55.025,20.425,0.2,19.8,4.0,19.7,10.675,15.6,2.4,-0.9,0.4,1.1,3.9,21.825,-2.0,-1.1,47.0,27.6,1.1,6.7225,12.825,22.175,37.6,2.4,46.8,10.225,27.6,4.725,1.7,-10.175,11.8,26.875,53.6,-0.674575,-114.262675,-11.772575,-0.7,0.0,-0.3,-0.6,-3.7,0.0,0.0,20.53265,0.0969,-0.2718,16.24905,-8.27805,-6.7844,0.0,4.0,64.7059,85.6187,0.8649,-0.12,-0.894,0.0,0.0,0.0,0.0,0.0,0.80115,0.0,12.835575,4.263175,-0.798675,-1.035525,0.28665,-2.3559,-0.2302,0.0,0.43735,-0.977175,-1.07045,-0.55145,-1.252,46.2717,3.027075,0.3366,0.8396,0.004,0.016,4.20195,2.9114,6.6789,1.3032,0.61975,4.7472,0.1721,0.45085,0.0,-4.175,-0.007995,1.0,0.006471,1.027318,-0.008772,0.004077,0.18017,-0.053965,-0.001724,-4.735941,-333.8074,-0.001142,-0.016587,-0.016564,-0.032504,28.96147,-0.003086,0.003008,0.119652,4.894849,0.7983436,-0.009696,116.374111,1.353203,0.142857,-0.008182,0.18017,0.25571,0.037452,-1.425581,40.60134,-0.011626,0.200459,38.6585,0.00949,0.044174,0.282898,0.091081,116.374111,0.101183,0.059404,0.962054,3.200098,2.364288,78.98834,0.989945,0.710932
50%,455.8,628.2,650.3,3.9,646.3,151.1517,316.75,211.35,0.6,139.1,21.65,138.85,302.15,344.05,18.2,3.2,22.65,5.0,26.1,141.25,6.2,4.1,101.5,271.75,33.95,243.805,330.05,399.3,518.8,18.3,271.5,129.95,271.75,48.25,8.75,31.4,97.5,435.2,603.6,1.4918,-0.6855,-0.01595,4.3,0.0,6.9,5.05,1.8,10.9,0.0,236.6578,0.4997,0.2699,87.9158,12.6447,0.4644,0.0,26.6,87.8167,94.135,3.2727,0.85985,2.3403,0.0,0.0,0.0,9.80475,0.0,17.8379,6.86935,39.72645,12.47925,3.32575,2.43405,5.7614,2.1495,3.1546,3.6,7.9895,2.24605,1.4525,1.77805,0.9544,91.3714,25.6914,0.7819,1.3486,0.277,0.079,16.2286,6.3741,15.3993,4.1062,3.4375,10.705,1.414,2.7303,0.0,2.85,0.011258,1.0,0.247049,1.581411,0.009847,0.049802,0.668327,0.052098,0.056022,7.905203,4040.371,0.034333,0.010303,0.010319,0.022849,58.2544,0.02381,0.037127,0.692631,6.478509,1.338099,0.04251,240.299109,4.1976,0.872274,0.014718,0.668327,0.509422,0.143149,-0.990776,77.4392,0.12231,0.570351,82.73157,0.066798,0.116159,0.524214,0.279163,240.299109,0.38253,0.210596,1.009328,6.260408,4.710599,150.405,2.424783,1.889629
75%,3447.8,3898.3,4820.4,88.3,4812.7,1264.935,1922.825,1576.625,2.0,741.9,92.075,741.1,2582.4,2842.05,131.4,74.225,267.825,29.875,158.725,736.575,192.625,113.95,247.325,1847.6,360.575,2164.39,2766.5,3149.675,3393.4,131.475,2154.4,1108.8,1847.6,458.175,73.125,233.15,725.6,3401.125,3803.0,146.673925,23.7838,1.79515,91.375,0.0,136.525,119.975,128.025,155.9,5.166025,669.3752,1.1513,1.717925,107.65125,80.4062,8.32045,5.3999,162.1,94.1122,97.9381,11.5385,7.513825,9.0756,0.0,0.0,0.128025,26.155825,0.0,48.9897,18.3216,66.002475,28.8142,12.45683,9.11545,14.690475,8.4506,11.77735,12.44415,20.64445,9.41465,6.693275,7.38575,4.7562,111.0994,48.057725,1.7481,2.8736,1.005475,0.5357,91.25,11.9115,39.590175,8.1929,7.3156,23.8382,3.8516,7.4979,0.0,92.225,0.048041,1.0,0.517716,3.836602,0.041975,0.102553,1.185354,0.303796,0.142857,158.00423,10376.17,0.088331,0.053003,0.053005,0.095877,113.8233,0.083349,0.084318,2.084828,8.481317,3.762139,0.138064,969.850095,8.470155,2.000511,0.064326,1.185354,0.868037,0.51514,-0.55755,153.8974,0.562551,0.829235,176.4824,0.129182,0.24065,0.750547,0.498805,969.850095,2.720598,0.334169,1.19955,12.576208,8.969016,367.8688,4.618635,4.738487
max,4575377.0,4527164.0,27059660.0,314250.0,27059660.0,22687520.0,1273003.0,1515580.0,120303.1,272231.6,172527.9,272231.6,4283153.0,4320302.0,140044.4,314250.0,1652979.0,1755182.0,1136585.0,623701.9,435700.0,451913.3,102593.2,2973520.0,1675912.0,3044451.0,4194499.0,4536911.0,3657623.0,140044.4,4412710.0,1545780.0,2973520.0,926980.0,2056212.0,2211548.0,1878432.0,4570759.0,4679762.0,484443.9706,218008.1552,44637.1934,314250.0,7139.9,513409.8,407770.0,349000.0,486767.3,2535.0,2120600.0,44.0,860.6667,20103.2212,449418.4615,10628.1783,2535.0,1136585.0,275.0,300.0,117.6314,13410.0,4266.667,134.947,1660750.0,13065.7895,360000.0,1350.0,3430500.0,77066.67,33625.0,1126.9136,669.2308,4266.667,153.8462,4266.667,445.8128,1664.4746,1702.9307,332.5318,280.0,3422.2222,121.223,135734.0,100.0,3752.0,5910.0,530.3462,3742.0,108364.4444,1023.0,85382.4,22794.0,35168.0,6807.7477,21604.0,21604.0,1.0,278590.0,3.381818,1.0,676.07764,8664.0,3.381818,301.193548,22.279236,2017.0,18446.285714,278590.006456,inf,3.4,3.381818,3.381818,17962.0,141816400.0,17962.0,3.4,20999.0,17.113555,1146629.0,171515.571429,inf,4765.5,inf,3.381818,22.279236,53.848485,inf,24140.0,1996550.0,2534.0,0.999967,inf,304.258065,137124.714286,8.428571,inf,inf,12348.76,1.157143,136761.0,21450.75,17095.5,128328200.0,2410.0,15799.0


In [11]:
df.isnull().sum()

sa_total_income                                                          212
sa_sales                                                                 923
sa_total_assets                                                            5
sa_pat                                                                    22
sa_total_liabilities                                                       1
sa_gross_working_capital_cosm                                              0
sa_current_assets_incl_st_invest_loans                                    84
sa_current_liabilities                                                   148
sa_cash_bal                                                             1136
sa_st_trade_bills_receivables                                            843
sa_debtors_more_6m                                                      2316
sa_st_trade_receivables                                                  844
sa_nf_operating_expenses                                                  22

In [None]:
df.isif

In [12]:
#write to file
df.to_csv('../data/model_data_feature_engineered.csv')