## Data Cleaning

In [1]:
import pandas as pd
import numpy as np


In [2]:
# Raise pandas' display limits so wide/long frames are not truncated when shown.
# NOTE: with max_rows at 7000, any frame up to that length is printed in full.
for display_option, display_limit in (('display.max_columns', 50),
                                      ('display.max_rows', 7000)):
    pd.set_option(display_option, display_limit)

In [3]:
# Load the combined mutual-fund dataset from the project's Data directory.
df_mf = pd.read_csv(filepath_or_buffer='../Data/df_all_mutual_fund_data')

In [4]:
# Preview the first five rows of the raw data as loaded.
df_mf.head()

Unnamed: 0,ticker,morningstar_risk,avg_moat_rating,morningstar_sustainability_rating,three_year_return,three_year_mean_div_yield,pct_cash,price_to_earnings,price_to_cash_flow,avg_market_cap,roe_last_year,debt_to_capital_last_year,no_of_holdings_in_portfolio,pct_assets_in_top10_holdings,turnover,avg_manager_tenure,expense_ratio,no_load_funds,min_initial_purchase,total_assets,closed_to_new_investors,sp500_three_year_return
0,AAAGX,Above Average,4.283,3,20.73,1.97,1.69,32.14,24.23,294701,31.56,44.55,45,55.73,58,2,1.14,No,2000.0,1768,No,34.2
1,AACIX,High,--,2,0.22,0.48,3.79,12.96,6.84,8740,2.21,48.49,124,18.37,35,6,0.95,Yes,250000.0,195,No,34.2
2,AADEX,Above Average,3.459,2,3.75,0.67,1.72,15.04,10.34,57742,12.54,48.12,168,21.82,67,12,0.63,Yes,250000.0,4242,No,34.2
3,AADGX,Below Average,3.347,3,6.39,0.66,2.62,21.85,16.11,14323,26.21,40.21,51,24.66,47,5,1.08,Yes,2500.0,70,No,34.2
4,AAGOX,Above Average,3.748,2,27.82,2.38,0.22,42.08,26.35,152652,21.25,36.98,59,47.3,144,19,0.89,Yes,0.0,446,No,34.2


### Rename columns

In [5]:
# Map every raw column name to its human-readable label.  Renaming by NAME
# (instead of assigning a positional list to df_mf.columns) means a change in
# the CSV's column order can no longer silently attach a label to the wrong data.
COLUMN_LABELS = {
    'ticker': 'Ticker',
    'morningstar_risk': 'Morningstar Risk',
    'avg_moat_rating': 'Average Moat Rating',
    'morningstar_sustainability_rating': 'Morningstar Sustainability Rating',
    'three_year_return': '3-year Return (%)',
    'three_year_mean_div_yield': 'Dividend Yield (%)',
    'pct_cash': '% of Holdings in Cash',
    'price_to_earnings': 'Price/Earnings',
    'price_to_cash_flow': 'Price/Cash Flow',
    'avg_market_cap': 'Average Market Cap ($ mil)',
    'roe_last_year': 'ROE Last Year (%)',
    'debt_to_capital_last_year': 'Debt/Capital Last Year (%)',
    'no_of_holdings_in_portfolio': 'No. of Holdings in Portfolio',
    'pct_assets_in_top10_holdings': '% Assets in Top 10 Holdings',
    'turnover': 'Turnover Ratio (%)',
    'avg_manager_tenure': 'Average Manager Tenure (years)',
    'expense_ratio': 'Expense Ratio (%)',
    'no_load_funds': 'No-load Funds',
    'min_initial_purchase': 'Minimum Initial Purchase ($)',
    'total_assets': 'Total Assets ($ mil)',
    'closed_to_new_investors': 'Closed to New Investors',
    'sp500_three_year_return': 'S&P500 3-year Return (%)',
}

# In-place, like the rest of this notebook.  Re-running the cell is harmless:
# names that were already renamed simply no longer match any key.
df_mf.rename(columns=COLUMN_LABELS, inplace=True)

# rename() ignores keys it cannot find, so verify that every expected label
# really exists before later cells start selecting columns by these names.
missing_labels = [label for label in COLUMN_LABELS.values() if label not in df_mf.columns]
assert not missing_labels, f'columns missing after renaming: {missing_labels}'

In [6]:
# Preview the first five rows again, now under the renamed column labels.
df_mf.head()

Unnamed: 0,Ticker,Morningstar Risk,Average Moat Rating,Morningstar Sustainability Rating,3-year Return (%),Dividend Yield (%),% of Holdings in Cash,Price/Earnings,Price/Cash Flow,Average Market Cap ($ mil),ROE Last Year (%),Debt/Capital Last Year (%),No. of Holdings in Portfolio,% Assets in Top 10 Holdings,Turnover Ratio (%),Average Manager Tenure (years),Expense Ratio (%),No-load Funds,Minimum Initial Purchase ($),Total Assets ($ mil),Closed to New Investors,S&P500 3-year Return (%)
0,AAAGX,Above Average,4.283,3,20.73,1.97,1.69,32.14,24.23,294701,31.56,44.55,45,55.73,58,2,1.14,No,2000.0,1768,No,34.2
1,AACIX,High,--,2,0.22,0.48,3.79,12.96,6.84,8740,2.21,48.49,124,18.37,35,6,0.95,Yes,250000.0,195,No,34.2
2,AADEX,Above Average,3.459,2,3.75,0.67,1.72,15.04,10.34,57742,12.54,48.12,168,21.82,67,12,0.63,Yes,250000.0,4242,No,34.2
3,AADGX,Below Average,3.347,3,6.39,0.66,2.62,21.85,16.11,14323,26.21,40.21,51,24.66,47,5,1.08,Yes,2500.0,70,No,34.2
4,AAGOX,Above Average,3.748,2,27.82,2.38,0.22,42.08,26.35,152652,21.25,36.98,59,47.3,144,19,0.89,Yes,0.0,446,No,34.2


In [7]:
# Print each column's dtype and non-null count.  Missing entries appear in the
# data as the string '--' (see the head() output), so they still count as non-null.
df_mf.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6521 entries, 0 to 6520
Data columns (total 22 columns):
 #   Column                             Non-Null Count  Dtype  
---  ------                             --------------  -----  
 0   Ticker                             6521 non-null   object 
 1   Morningstar Risk                   6521 non-null   object 
 2   Average Moat Rating                6521 non-null   object 
 3   Morningstar Sustainability Rating  6521 non-null   object 
 4   3-year Return (%)                  6521 non-null   object 
 5   Dividend Yield (%)                 6521 non-null   object 
 6   % of Holdings in Cash              6521 non-null   float64
 7   Price/Earnings                     6521 non-null   object 
 8   Price/Cash Flow                    6521 non-null   object 
 9   Average Market Cap ($ mil)         6521 non-null   object 
 10  ROE Last Year (%)                  6521 non-null   object 
 11  Debt/Capital Last Year (%)         6521 non-null   objec

### Fill missing values

The values shown as `--` are not actually missing: they appear once you visit each mutual fund's own webpage. Filling them in is therefore a manual and time-consuming process, but it is better than imputing guesstimates. (Beautiful Soup would not have worked for certain metrics because the pages are rendered dynamically; Selenium could have been used instead.)

In [8]:
# Remove, in place, every fund whose Morningstar risk rating is the '--' placeholder.
df_mf.drop(index=df_mf.index[df_mf['Morningstar Risk'].eq('--')], inplace=True)

In [9]:
# Discard the 'Average Moat Rating' column entirely (in place).
df_mf.drop(columns='Average Moat Rating', inplace=True)

In [10]:
# Remove, in place, every fund whose last-year ROE is the '--' placeholder.
df_mf.drop(index=df_mf.index[df_mf['ROE Last Year (%)'].eq('--')], inplace=True)

In [11]:
# Mean price/earnings ratio over all remaining funds.  The column is stored as
# strings, so it is cast to float first (this raises if any '--' is left in it).
pe_mean = df_mf.loc[:, 'Price/Earnings'].astype('float64').mean()

In [12]:
# Mean price/cash-flow ratio, computed only over funds that actually report one
# (rows holding the '--' placeholder are excluded before the cast to float).
pcf_mean = df_mf.loc[df_mf['Price/Cash Flow'].ne('--'), 'Price/Cash Flow'].astype('float64').mean()

In [13]:
# Average gap between P/E and P/CF; used further down to estimate a missing
# P/CF value from the same fund's P/E.
pe_pcf_diff = pe_mean - pcf_mean

In [14]:
# Display the computed P/E minus P/CF gap.
pe_pcf_diff

7.734677027501206

In [15]:
# Estimate each missing P/CF as the fund's own P/E minus the average P/E-to-P/CF gap.
# NOTE(review): a fund whose P/E is below pe_pcf_diff receives a negative P/CF estimate.
pcf_is_missing = df_mf['Price/Cash Flow'].eq('--')
df_mf.loc[pcf_is_missing, 'Price/Cash Flow'] = (
    df_mf.loc[pcf_is_missing, 'Price/Earnings'].astype(float) - pe_pcf_diff
)

In [16]:
# Remove, in place, every fund whose top-10-holdings share is the '--' placeholder.
df_mf.drop(index=df_mf.index[df_mf['% Assets in Top 10 Holdings'].eq('--')], inplace=True)

In [17]:
# Show the five most frequent raw values in the 3-year return column, which
# reveals how many rows still hold the '--' placeholder.
df_mf['3-year Return (%)'].value_counts().head()

--       294
12.18      9
4.77       9
3.88       9
2.57       9
Name: 3-year Return (%), dtype: int64

In [18]:
# 3-year returns filled in by hand, keyed by fund ticker.  Values are kept as
# strings because the '3-year Return (%)' column is still of object dtype here.
# Keeping the data in one table (rather than one copy-pasted statement per fund)
# makes it easy to audit and extend.
THREE_YEAR_RETURN_FIXES = {
    'ABCRX': '8.89',
    'ACFGX': '32.62',
    'ACMSX': '-2.35',
    'ADNAX': '48.84',
    'ADNCX': '47.73',
    'ADNRX': '49.24',
    'AEIMX': '5.49',
    'AFEDX': '12.75',
    'AFEGX': '13.02',
    'AMDRX': '0.67',
    'ANOHX': '26.1',
    'APDTX': '21.04',
    'APHTX': '21.02',
    'APSRX': '19.28',
    'ASCFX': '10.97',
    'ASEFX': '11.57',
    'ASPYX': '21.36',
    'ASVHX': '8.37',
    'ATFFX': '22.37',
    'AULNX': '24.69',
    'BAFMX': '19.33',
    'BDBPX': '11.64',
    'BGFRX': '20.93',
    'BIIGX': '16.5',
    'BLYRX': '15.55',
    'BSGRX': '19.91',
    'BSMRX': '0.72',
    'BSPGX': '12.45',
    'BSPPX': '12.1',
    'BUIDX': '10.47',
    'BUIEX': '16.27',
    'BUIMX': '17.46',
    'BUIOX': '24.91',
    'BUISX': '32.23',
    'BUITX': '17.32',
    'BVDRX': '0.11',
    'CABGX': '18.2',
    'CALRX': '10.8',
    'CBMYX': '5.53',
    'CERPX': '10.46',
    'CFDAX': '4.63',
    'CGQGX': '12.53',
    'CGRGX': '12.85',
    'CISGX': '28.82',
    'CLIQX': '7.11',
    'CPTUX': '18.32',
    'CSCLX': '11.21',
    'CSDGX': '9.38',
    'CTSOX': '28.73',
    'CVSDX': '6.03',
    'DGEZX': '3.2',
    'DIGGX': '26.15',
    'DLCZX': '11.59',
    'DMCFX': '21.09',
    'DSEPX': '15.31',
    'DSFRX': '15.64',
    'DSMZX': '16.12',
    'EAFRX': '-0.06',
    'EGWRX': '30.16',
    'EPLMX': '3.88',
    'FAFGX': '17.8',
    'FAOOX': '8.13',
    'FCIAX': '8.12',
    'FEEFX': '9.28',
    'FERFX': '-0.01',
    'FFAFX': '17.8',
    'FFFMX': '6.33',
    'FFMMX': '6.33',
    'FFQBX': '25.58',
    'FFQCX': '24.67',
    'FFQRX': '25.36',
    'FFQSX': '25.93',
    'FFXFX': '9.27',
    'FGPGX': '12.82',
    'FIKNX': '6.03',
    'FMCMX': '12.33',
    'FMMMX': '12.33',
    'FMVQX': '3.83',
    'FPGGX': '12.84',
    'FTHAX': '7.46',
    'FTXAX': '23.45',
    'FTXCX': '22.74',
    'FTYCX': '6.76',
    'FWMMX': '7.91',
    'FWWMX': '7.91',
    'GABPX': '5.6',
    'GACPX': '20.24',
    'GALPX': '14.81',
    'GCEUX': '13.55',
    'GCTRX': '9.36',
    'GGGPX': '14.52',
    'GGQPX': '21.16',
    'GGYPX': '7.24',
    'GGZPX': '13.17',
    'GIDWX': '9.44',
    'GMAPX': '7.97',
    'GMHPX': '7.8',
    'GMPPX': '8.57',
    'GMXPX': '2.48',
    'GMYPX': '4.73',
    'GMZPX': '16.27',
    'GQESX': '13.99',
    'GQLIX': '13.92',
    'GQURX': '13.7',
    'GSDPX': '9.35',
    'GSEPX': '10.02',
    'GSFPX': '9.41',
    'GSPPX': '21.7',
    'GSRFX': '7.79',
    'GSVPX': '5.67',
    'GSWPX': '25.93',
    'GSXPX': '4.77',
    'GSYPX': '3.67',
    'GSZPX': '12.49',
    'HLSCX': '5.12',
    'HSMVX': '5.65',
    'HVOVX': '5.1',
    'HWLZX': '2.02',
    'HWMZX': '-2.73',
    'HWSZX': '1.83',
    'HWVZX': '3.52',
    'IATNX': '21.62',
    'IOAPX': '11.93',
    'IOVVX': '3.27',
    'IRTCX': '2.96',
    'JGRRX': '17.2',
    'JIIGX': '12.36',
    'JNVYX': '9.06',
    'JPELX': '14.03',
    'JPFRX': '13.67',
    'JSCHX': '16.65',
    'JSJAX': '14.03',
    'JSJCX': '13.19',
    'JSJFX': '14.43',
    'JSJIX': '14.3',
    'JSSGX': '22.23',
    'KNGYX': '7.64',
    'LCGJX': '21.54',
    'LCLTX': '32.15',
    'LCMGX': '37.62',
    'LFMGX': '38.86',
    'LFSFX': '7.07',
    'LFVCX': '6.01',
    'LMVOX': '7.16',
    'LMVVX': '7.12',
    'LMVWX': '7.17',
    'LSMNX': '17.63',
    'MADAX': '7.45',
    'MASMX': '10.8',
    'MAWDX': '7.52',
    'MBIRX': '46.93',
    'MCIMX': '3.19',
    'MDCIX': '11.09',
    'MDMIX': '7.75',
    'MDVWX': '5.12',
    'MDVZX': '4.89',
    'MEYWX': '15.17',
    'MGHRX': '40.01',
    'MIVIX': '11.87',
    'MKFOX': '21.91',
    'MMIJX': '4.22',
    'MMMMX': '2.55',
    'MMMSX': '3.32',
    'MNSQX': '12.66',
    'MSAZX': '11.92',
    'MSJFX': '10.83',
    'MSMJX': '8.13',
    'MVISX': '20.88',
    'MXHAX': '4.81',
    'NBMRX': '-1.31',
    'NGRDX': '17.83',
    'NRINX': '13.94',
    'NRLCX': '12.01',
    'NSCKX': '9.65',
    'NSRSX': '27.94',
    'NUEIX': '13.08',
    'NWABX': '12.91',
    'NWADX': '15.05',
    'NWAEX': '14.96',
    'NWALX': '6.26',
    'NWANX': '6.54',
    'NWAOX': '6.45',
    'NWAPX': '6.51',
    'OAZLX': '-0.16',
    'OAZMX': '5.81',
    'OFAVX': '7.45',
    'OLVRX': '5.29',
    'OLVTX': '5',
    'OMYGX': '6.75',
    'PBSRX': '22.57',
    'PCEKX': '11.13',
    'PCMSX': '6.16',
    'PCMVX': '5.65',
    'PEIJX': '7.79',
    'PEMCX': '10.3',
    'PGWTX': '7.17',
    'PIOKX': '14.94',
    'PLIEX': '16.4',
    'PMYTX': '11.93',
    'PNOTX': '22.59',
    'PSLGX': '18.04',
    'QRSAX': '9.74',
    'QRSIX': '9.74',
    'RLSMX': '6.85',
    'RMOMX': '14.64',
    'RSDQX': '9.88',
    'RSMMX': '20.24',
    'RSPMX': '5.29',
    'RTDAX': '9.37',
    'RTDCX': '8.57',
    'SBRVX': '8.62',
    'SCSIX': '4.2',
    'SFMRX': '20.68',
    'SLCSX': '14.24',
    'SOIVX': '10.03',
    'STRAX': '1.05',
    'STRBX': '0.23',
    'STREX': '8.4',
    'STRMX': '3.99',
    'STRSX': '10.68',
    'STSRX': '20.28',
    'TASZX': '2.15',
    'TCPWX': '38.15',
    'TDELX': '12.79',
    'TDEYX': '12.77',
    'TEQWX': '13.14',
    'TFGRX': '17.89',
    'TGIWX': '12.15',
    'THCWX': '4.88',
    'TILWX': '21.52',
    'TISWX': '12.41',
    'TRGOX': '20.41',
    'TRHZX': '12.28',
    'TRIWX': '20.94',
    'TRJZX': '18.72',
    'TRLUX': '4.67',
    'TRLWX': '3.27',
    'TRQZX': '15.53',
    'TRTZX': '5.38',
    'TRUZX': '29.25',
    'TRZAX': '7.74',
    'TRZLX': '11.3',
    'TRZVX': '8.89',
    'TRZZX': '18.03',
    'TSCWX': '9.27',
    'TSMUX': '13.42',
    'TSNRX': '28.79',
    'UANQX': '24.69',
    'UCNQX': '23.78',
    'UINQX': '25',
    'VCGRX': '20.83',
    'VECRX': '7.85',
    'VFTAX': '14.94',
    'VHDPX': '6.62',
    'VHDRX': '6.15',
    'VHYAX': '4.58',
    'VILSX': '16.39',
    'VIPAX': '10.33',
    'VLVPX': '5.89',
    'VMMCX': '3.82',
    'VMMPX': '4.04',
    'VPLCX': '18.51',
    'VPMOX': '17.98',
    'VRMCX': '14.3',
    'VRMGX': '32.36',
    'VRSGX': '28.03',
    'VSOPX': '11.23',
    'VSRAX': '2.53',
    'VVERX': '2.41',
    'VVILX': '10.81',
    'VVISX': '5.7',
    'VYCEX': '9.34',
    'VYMUX': '6.65',
    'VYSCX': '7.13',
    'VZGRX': '47.21',
    'WBSRX': '19.57',
    'WCGJX': '17.56',
    'WDSAX': '6',
    'WECRX': '21.45',
    'WEGRX': '27.48',
    'WFICX': '1.42',
    'WFSJX': '5.77',
    'WGICX': '36.34',
    'WGMCX': '38.44',
    'WGMVX': '21.84',
    'WHGAX': '4.56',
    'WHGCX': '3.81',
    'WOFRX': '11.92',
    'WSMRX': '18.63',
    'WWLCX': '4.9',
    'WWSMX': '6.5',
    'WWSYX': '4.8',
    'EARFX': '-0.18',
}

# Write each looked-up value onto the row(s) of the matching fund.  A ticker that
# is not present in df_mf matches no rows, so that entry is silently a no-op.
for fund_ticker, three_year_return in THREE_YEAR_RETURN_FIXES.items():
    df_mf.loc[df_mf['Ticker'] == fund_ticker, '3-year Return (%)'] = three_year_return

In [19]:
# Remove, in place, any fund whose 3-year return is still the '--' placeholder.
df_mf.drop(index=df_mf.index[df_mf['3-year Return (%)'].eq('--')], inplace=True)

In [20]:
# Expense ratios filled in by hand, keyed by fund ticker.  Values are written as
# strings, exactly as given here (e.g. '0.40' keeps its trailing zero).
# Keeping the data in one table (rather than one copy-pasted statement per fund)
# makes it easy to audit and extend.
EXPENSE_RATIO_FIXES = {
    'ADNRX': '0.96',
    'CGRGX': '0.42',
    'DLCEX': '0.98',
    'DLCIX': '0.73',
    'DSCIX': '0.95',
    'EGWRX': '0.81',
    'ESGIX': '0.85',
    'FAFGX': '0.43',
    'FAOOX': '0.33',
    'FCIAX': '0.39',
    'FEEFX': '0.34',
    'FFAFX': '0.36',
    'FFFMX': '0.33',
    'FFMMX': '0.38',
    'FFNPX': '0',
    'FFXFX': '0.40',
    'FGPGX': '0.53',
    'FLCLX': '0',
    'FMCMX': '0.40',
    'FMMMX': '0.47',
    'FPGGX': '0.43',
    'FSBDX': '0',
    'FSOPX': '0',
    'FWMMX': '0.38',
    'FWWMX': '0.33',
    'GSQTX': '1.03',
    'HLSCX': '1.11',
    'JAVTX': '0.91',
    'JIIGX': '0.34',
    'JSSGX': '1.09',
    'MGTIX': '0.47',
    'MIGKX': '0.47',
    'MIGNX': '0.38',
    'MIRTX': '0.96',
    'MITDX': '0.46',
    'MITGX': '1.46',
    'MITHX': '0.71',
    'MITIX': '0.46',
    'MITJX': '0.38',
    'MMIJX': '0.85',
    'MMMMX': '1.40',
    'MMMSX': '0.95',
    'NSCKX': '0.50',
    'NUEIX': '0.49',
    'OAZLX': '0.75',
    'OAZMX': '0.63',
    'PLIEX': '1.00',
    'QRSAX': '0.99',
    'QRSIX': '0.89',
    'RLSMX': '0.92',
    'RMOMX': '1.05',
    'RSMMX': '1.15',
    'RSPMX': '1.25',
    'SLCGX': '1.12',
    'SLCVX': '1.18',
    'SMIPX': '1.46',
    'SOIVX': '1.22',
    'SSCPX': '1.69',
    'TRGOX': '0.70',
    'TRHZX': '0',
    'TRJZX': '0',
    'TRLUX': '0.70',
    'TRQZX': '0',
    'TRTZX': '0',
    'TRUZX': '0',
    'TRZAX': '0',
    'TRZLX': '0',
    'TRZVX': '0.06',
    'TRZZX': '0.01',
    'UANQX': '0.70',
    'UCNQX': '1.45',
    'UINQX': '0.44',
    'VDEQX': '0.35',
    'VILSX': '0.91',
    'VZGRX': '0.90',
    'WFSJX': '0.90',
    'WWSYX': '0.79',
}

# Write each looked-up value onto the row(s) of the matching fund.  A ticker that
# is not present in df_mf matches no rows, so that entry is silently a no-op.
for fund_ticker, expense_ratio in EXPENSE_RATIO_FIXES.items():
    df_mf.loc[df_mf['Ticker'] == fund_ticker, 'Expense Ratio (%)'] = expense_ratio

In [21]:
df_mf.loc[df_mf['Ticker']=='AAWVX','Total Assets ($ mil)'] =1
df_mf.loc[df_mf['Ticker']=='ACFNX','Total Assets ($ mil)'] =2100
df_mf.loc[df_mf['Ticker']=='AFGFX','Total Assets ($ mil)'] =1300
df_mf.loc[df_mf['Ticker']=='AGRYX','Total Assets ($ mil)'] =1500
df_mf.loc[df_mf['Ticker']=='ALFQX','Total Assets ($ mil)'] =825
df_mf.loc[df_mf['Ticker']=='BOSVX','Total Assets ($ mil)'] =1100
df_mf.loc[df_mf['Ticker']=='CSCRX','Total Assets ($ mil)'] =2700
df_mf.loc[df_mf['Ticker']=='CSMSX','Total Assets ($ mil)'] =3400
df_mf.loc[df_mf['Ticker']=='DLACX','Total Assets ($ mil)'] =835
# Hard-coded 'Total Assets ($ mil)' values, keyed by fund ticker.
# NOTE(review): where these figures come from is not shown here - confirm the source.
total_assets_overrides = {
    'DTMVX': 5000,
    'DUZRX': 2700,
    'EGORX': 487,
    'FBLEX': 11000,
    'FCMVX': 39,
    'FCTGX': 5400,
    'FDESX': 2600,
    'FKKSX': 10500,
    'FSKGX': 186,
    'FSLZX': 2000,
    'FTGRX': 1300,
    'FVLKX': 6600,
    'GCMRX': 1100,
    'GMZPX': 2000,
    'GNWRX': 1200,
    'GRGVX': 12,
    'GTMTX': 3000,
    'HBSGX': 1400,
    'HFMRX': 15300,
    'HVOTX': 191,
    'IASAX': 348,
    'IEOTX': 6300,
    'IHSVX': 927,
    'IJMIX': 371,
    'IRVSX': 844,
    'ITHTX': 7100,
    'IYGIX': 5700,
    'JICPX': 2100,
    'JLGRX': 32900,
    'JMGPX': 7900,
    'JSSOX': 386,
    'LAMTX': 2800,
    'LCBVX': 1700,
    'LGLOX': 8600,
    'LMVRX': 1800,
    'LOVLX': 1300,
    'LVOQX': 1600,
    'MAEIX': 3700,
    'MCJYX': 324,
    'MFRLX': 6900,
    'MGRSX': 516,
    'MIRTX': 6400,
    'MLVMX': 580,
    'MMFVX': 743,
    'MMQIX': 91,
    'MRGHX': 4700,
    'MSSRX': 116,
    'MUERX': 1200,
    'MVCHX': 11700,
    'MXKJX': 710,
    'OISGX': 725,
    'PCANX': 2000,
    'PGIAX': 731,
    'PGWIX': 263,
    'PLVIX': 2300,
    'PNSAX': 777,
    'PQIRX': 2300,
    'PSCHX': 1900,
    'PSSIX': 1300,
    'RLCOX': 233,
    'RMORX': 591,
    'RSGSX': 154,
    'SWSCX': 627,
    'TCPWX': 5100,
    'TEQWX': 30700,
    'TOTRX': 1600,
    'TRLCX': 5100,
    'TVRFX': 806,
    'VCGAX': 156,
    'VRMGX': 3300,
}

# Write each value into every row whose Ticker matches (no-op when the ticker is absent).
for fund_ticker, assets_mil in total_assets_overrides.items():
    df_mf.loc[df_mf['Ticker'] == fund_ticker, 'Total Assets ($ mil)'] = assets_mil

In [22]:
# Hard-coded 'Minimum Initial Purchase ($)' values, keyed by fund ticker.
# NOTE(review): where these figures come from is not shown here - confirm the source.
min_initial_purchase_by_ticker = {
    'AAWVX': 0,
    'ACCLX': 2500,
    'ACFNX': 0,
    'ACGCX': 2500,
    'ACGQX': 1000000,
    'ACSHX': 1000000,
    'ADGZX': 2000000,
    'AFDIX': 2500,
    'AFGFX': 0,
    'AGRYX': 0,
    'AISZX': 500000,
    'AIVSX': 250,
    'ALFQX': 0,
    'AMCSX': 2500,
    'AMGAX': 1000,
    'AMRFX': 250,
    'ANONX': 5000000,
    'ARSKX': 2500,
    'ARTSX': 1000,
    'BCIFX': 5000,
    'BDSIX': 2000000,
    'BFGIX': 1000000,
    'BIAUX': 100,
    'BOSOX': 100000,
    'BOSVX': 0,
    'BRSWX': 250,
    'BSCVX': 25000,
    'BSPGX': 0,
    'BSPIX': 2000000,
    'CAFFX': 250,
    'CBECX': 1000,
    'CBSAX': 2000,
    'CCASX': 2500,
    'CGPEX': 250,
    'CHASX': 2000,
    'CIDVX': 1000000,
    'CRMMX': 2500,
    'CSCRX': 0,
    'CSMSX': 0,
    'CSXCX': 5000,
    'DCCCX': 1000,
    'DDFIX': 1000000,
    'DHTYX': 500000,
    'DLACX': 0,
    'DMVAX': 1000,
    'DNLRX': 1000,
    'DRDIX': 500000,
    'DTCAX': 1000,
    'DTMVX': 0,
    'DUZRX': 0,
    'EAGCX': 1000,
    'ECOLX': 2500,
    'ECSTX': 1000,
    'EDFWX': 50000,
    'EGORX': 0,
    'EIMGX': 250000,
    'ENSBX': 5000,
    'ESGIX': 100000,
    'ESPAX': 1000,
    'EVSTX': 1000,
    'FACSX': 3000,
    'FBLEX': 0,
    'FCMVX': 0,
    'FCTGX': 0,
    'FDESX': 0,
    'FFIOX': 2000,
    'FFQRX': 1000,
    'FKKSX': 0,
    'FSGRX': 1000,
    'FSKGX': 0,
    'FSLZX': 0,
    'FTGRX': 0,
    'FTVNX': 1000,
    'FVLKX': 0,
    'GBCCX': 1000,
    'GBSAX': 2500,
    'GCLLX': 1000,
    'GCMRX': 0,
    'GENIX': 250000,
    'GMZPX': 0,
    'GNWRX': 0,
    'GRGVX': 0,
    'GSCIX': 1000000,
    'GTMTX': 0,
    'GVCIX': 250000,
    'GWEZX': 5000000,
    'HBSGX': 0,
    'HDGYX': 250000,
    'HEQCX': 1000000,
    'HFMDX': 2500,
    'HFMRX': 0,
    'HHDFX': 100000,
    'HNDDX': 2500,
    'HNMVX': 1000000,
    'HRCVX': 1000,
    'HULIX': 5000,
    'HVOTX': 0,
    'IASAX': 0,
    'IDANX': 1000000,
    'IEOTX': 0,
    'IHSVX': 0,
    'IJMIX': 0,
    'IRVSX': 0,
    'ITHTX': 0,
    'IYGIX': 0,
    'JAPAX': 2500,
    'JBGCX': 1000,
    'JCSCX': 2500,
    'JDEAX': 1000,
    'JGACX': 1000,
    'JHKAX': 1000,
    'JICPX': 0,
    'JLGRX': 0,
    'JMGPX': 0,
    'JRSDX': 2500,
    'JSSOX': 0,
    'JSSSX': 1000000,
    'JSVAX': 2500,
    'JVACX': 1000,
    'KSOAX': 2500,
    'LAMTX': 0,
    'LCBVX': 0,
    'LCGJX': 1000000,
    'LCIAX': 100000,
    'LDVCX': 2500,
    'LEGCX': 2000,
    'LEVOX': 2500,
    'LGLOX': 0,
    'LMVRX': 0,
    'LOVLX': 0,
    'LSSIX': 100000,
    'LVOQX': 0,
    'LVPIX': 15000,
    'MADVX': 2000000,
    'MAEIX': 0,
    'MCJYX': 0,
    'MDCIX': 250000,
    'MFCIX': 2500,
    'MFRLX': 0,
    'MGRSX': 0,
    'MIDIX': 1000000,
    'MIRTX': 0,
    'MLVMX': 0,
    'MMEAX': 2500,
    'MMFVX': 0,
    'MMQIX': 0,
    'MNNCX': 2500,
    'MNRMX': 1000,
    'MRGHX': 0,
    'MRLIX': 5000000,
    'MSEFX': 10000,
    'MSSMX': 1000,
    'MSSRX': 0,
    'MUERX': 0,
    'MUXAX': 2500,
    'MVCHX': 0,
    'MXKJX': 0,
    'NBMLX': 1000000,
    'NCBVX': 1000,
    'NDGIX': 1000000,
    'NESNX': 1000000,
    'NEXTX': 1000,
    'NGQAX': 1000,
    'NSBFX': 1000000,
    'NSPAX': 1000,
    'NUESX': 2500,
    'NWHZX': 2000,
    'OAYLX': 100000,
    'OISGX': 0,
    'OSCAX': 1000,
    'OVECX': 1000,
    'PBSRX': 3000,
    'PCANX': 0,
    'PCVAX': 1000,
    'PECAX': 1000,
    'PFPCX': 1000,
    'PGIAX': 0,
    'PGWIX': 0,
    'PJGCX': 1000,
    'PLVIX': 0,
    'PNSAX': 0,
    'PQIRX': 0,
    'PRCGX': 1000,
    'PSCHX': 0,
    'PSSIX': 0,
    'PVEJX': 1000,
    'PZIMX': 1000000,
    'QASCX': 1500,
    'RFNEX': 250,
    'RLCOX': 0,
    'RMORX': 0,
    'RPMIX': 1000000,
    'RSGSX': 0,
    'RWMBX': 250,
    'RYLGX': 2500,
    'RYTFX': 2000,
    'SCRLX': 500000,
    'SCRYX': 5000,
    'SCSMX': 1000,
    'SHAPX': 1000,
    'SLGCX': 250,
    'SLVAX': 2000,
    'SMEAX': 1000,
    'SMGIX': 2000,
    'SMVLX': 3000,
    'SPWAX': 2500,
    'SSPSX': 5000000,
    'STVTX': 100000,
    'SUWCX': 1000,
    'SVTIX': 5000,
    'SWSCX': 0,
    'TCPWX': 0,
    'TDFAX': 1000,
    'TEQWX': 0,
    'TISPX': 10000000,
    'TMMAX': 100000,
    'TNVAX': 1000,
    'TOTRX': 0,
    'TPLGX': 1000000,
    'TPLNX': 1000,
    'TQSAX': 2500,
    'TRLCX': 0,
    'TRULX': 2500,
    'TSNCX': 2500,
    'TVRFX': 0,
    'UBVSX': 1000000,
    'UCNQX': 2500,
    'USMVX': 1000000,
    'VAFNX': 1000000,
    'VALUX': 1000,
    'VCGAX': 0,
    'VDEQX': 3000,
    'VFFSX': 0,
    'VLCAX': 3000,
    'VOLMX': 500,
    'VRMGX': 0,
    'VSEAX': 1000,
    'VSEMX': 0,
    'VSFAX': 1500,
    'VSMPX': 100000000,
    'VSPVX': 5000000,
    'VSTSX': 0,
    'VYMYX': 1000,
    'WEEIX': 500000,
    'WFEIX': 1000000,
    'WFOPX': 1000,
    'WIGRX': 100000,
    'WSMGX': 250000,
    'YFSIX': 100000,
}

# Write each value into every row whose Ticker matches (no-op when the ticker is absent).
for fund_ticker, min_purchase in min_initial_purchase_by_ticker.items():
    df_mf.loc[df_mf['Ticker'] == fund_ticker, 'Minimum Initial Purchase ($)'] = min_purchase

In [23]:
# Hard-coded 'Total Assets ($ mil)' values, keyed by fund ticker.
# NOTE(review): where these figures come from is not shown here - confirm the source.
total_assets_by_ticker = {
    'ACCLX': 8200,
    'ACGCX': 2400,
    'ACGQX': 4900,
    'ACSHX': 8500,
    'ADGZX': 206,
    'AFDIX': 3200,
    'AISZX': 353,
    'AIVSX': 108400,
    'AMCSX': 188,
    'AMGAX': 289,
    'AMRFX': 69300,
    'ANONX': 1900,
    'ARSKX': 23,
    'ARTSX': 4000,
    'BCIFX': 37,
    'BDSIX': 3000,
    'BFGIX': 663,
    'BIAUX': 1000,
    'BOSOX': 626,
    'BRSWX': 327,
    'BSCVX': 140,
    'BSPIX': 26300,
    'CAFFX': 78500,
    'CBECX': 259,
    'CBSAX': 2000,
    'CCASX': 3900,
    'CGPEX': 12600,
    'CHASX': 72,
    'CIDVX': 15,
    'CRMMX': 393,
    'CSXCX': 3600,
    'DCCCX': 6500,
    'DDFIX': 15700,
    'DHTYX': 326,
    'DMVAX': 533,
    'DNLRX': 430,
    'DRDIX': 390,
    'DTCAX': 440,
    'EAGCX': 390,
    'ECOLX': 16,
    'ECSTX': 1500,
    'EDFWX': 45,
    'EIMGX': 123,
    'ENSBX': 48,
    'ESGIX': 24,
    'ESPAX': 4700,
    'EVSTX': 973,
    'FACSX': 333,
    'FFIOX': 163,
    'FFQRX': 72,
    'FSGRX': 3800,
    'FTVNX': 66,
    'GBCCX': 20,
    'GBSAX': 43,
    'GCLLX': 25,
    'GENIX': 205,
    'GSCIX': 883,
    'GVCIX': 316,
    'GWEZX': 624,
    'HDGYX': 10600,
    'HEQCX': 31,
    'HFMDX': 390,
    'HHDFX': 611,
    'HNDDX': 116,
    'HNMVX': 408,
    'HRCVX': 839,
    'HULIX': 31,
    'IDANX': 410,
    'JAPAX': 96,
    'JBGCX': 5000,
    'JCSCX': 3700,
    'JDEAX': 5100,
    'JGACX': 14100,
    'JHKAX': 34,
    'JRSDX': 1100,
    'JSSSX': 12,
    'JSVAX': 3800,
    'JVACX': 9400,
    'KSOAX': 184,
    'LCGJX': 675,
    'LCIAX': 2200,
    'LDVCX': 235,
    'LEGCX': 4900,
    'LEVOX': 1900,
    'LSSIX': 2900,
    'LVPIX': 7,
    'MADVX': 18400,
    'MDCIX': 603,
    'MFCIX': 640,
    'MIDIX': 196,
    'MMEAX': 78,
    'MNNCX': 399,
    'MNRMX': 7,
    'MRLIX': 92,
    'MSEFX': 251,
    'MSSMX': 1400,
    'MUXAX': 242,
    'NBMLX': 1900,
    'NCBVX': 229,
    'NDGIX': 54,
    'NESNX': 919,
    'NEXTX': 253,
    'NGQAX': 4,
    'NSBFX': 5900,
    'NSPAX': 233,
    'NUESX': 276,
    'NWHZX': 1700,
    'OAYLX': 4000,
    'OSCAX': 1200,
    'OVECX': 73,
    'PBSRX': 108,
    'PCVAX': 549,
    'PECAX': 401,
    'PFPCX': 314,
    'PJGCX': 198,
    'PRCGX': 66,
    'PVEJX': 2300,
    'PZIMX': 105,
    'QASCX': 838,
    'RFNEX': 114300,
    'RPMIX': 2000,
    'RWMBX': 135200,
    'RYLGX': 39,
    'RYTFX': 1300,
    'SCRLX': 2000,
    'SCRYX': 827,
    'SCSMX': 6100,
    'SHAPX': 7100,
    'SLGCX': 32,
    'SLVAX': 1200,
    'SMEAX': 1000,
    'SMGIX': 11200,
    'SMVLX': 1400,
    'SPWAX': 435,
    'SSPSX': 88,
    'STVTX': 1300,
    'SUWCX': 4100,
    'SVTIX': 12,
    'TDFAX': 551,
    'TISPX': 7100,
    'TMMAX': 964,
    'TNVAX': 134,
    'TPLGX': 5900,
    'TPLNX': 140,
    'TQSAX': 150,
    'TRULX': 2100,
    'TSNCX': 5000,
    'UBVSX': 5400,
    'UCNQX': 3700,
    'USMVX': 20,
    'VAFNX': 15200,
    'VALUX': 73,
    'VDEQX': 2400,
    'VFFSX': 179500,
    'VLCAX': 21500,
    'VOLMX': 38,
    'VSEAX': 8300,
    'VSEMX': 14300,
    'VSFAX': 6,
    'VSMPX': 205700,
    'VSPVX': 1600,
    'VSTSX': 205700,
    'VYMYX': 126,
    'WEEIX': 51,
    'WFEIX': 1100,
    'WFOPX': 1900,
    'WIGRX': 3500,
    'WSMGX': 48,
    'YFSIX': 136,
}

# Write each value into every row whose Ticker matches (no-op when the ticker is absent).
for fund_ticker, assets_mil in total_assets_by_ticker.items():
    df_mf.loc[df_mf['Ticker'] == fund_ticker, 'Total Assets ($ mil)'] = assets_mil

In [24]:
# Remove every fund whose value in one of these columns is the '--' placeholder.
# Columns are handled one after another, in this order, and df_mf is mutated in place.
for placeholder_col in ('Dividend Yield (%)',
                        'Morningstar Sustainability Rating',
                        'Turnover Ratio (%)'):
    rows_to_drop = df_mf.loc[df_mf[placeholder_col] == '--'].index
    df_mf.drop(index=rows_to_drop, inplace=True)

In [25]:
# Display any rows that still hold the '--' placeholder in at least one column.
df_mf.loc[df_mf.eq('--').any(axis='columns')]

  res_values = method(rvalues)


Unnamed: 0,Ticker,Morningstar Risk,Morningstar Sustainability Rating,3-year Return (%),Dividend Yield (%),% of Holdings in Cash,Price/Earnings,Price/Cash Flow,Average Market Cap ($ mil),ROE Last Year (%),Debt/Capital Last Year (%),No. of Holdings in Portfolio,% Assets in Top 10 Holdings,Turnover Ratio (%),Average Manager Tenure (years),Expense Ratio (%),No-load Funds,Minimum Initial Purchase ($),Total Assets ($ mil),Closed to New Investors,S&P500 3-year Return (%)


In [26]:
# The benchmark return is a single constant for the whole dataset, so assign it
# directly. Avoid `column.replace(column, value)`: passing the column itself as
# `to_replace` makes pandas treat it as a dict-like mapping, which is fragile
# across pandas versions and obscures the intent.
# NOTE(review): 10.3 presumably is the annualized S&P 500 3-year return that
# supersedes the loaded figure (34.2 in the preview rows) - confirm the source.
SP500_3YR_RETURN_PCT = 10.3
df_mf['S&P500 3-year Return (%)'] = SP500_3YR_RETURN_PCT

In [27]:
# Inspect column dtypes and non-null counts after dropping the '--' placeholder rows.
df_mf.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 6016 entries, 0 to 6520
Data columns (total 21 columns):
 #   Column                             Non-Null Count  Dtype  
---  ------                             --------------  -----  
 0   Ticker                             6016 non-null   object 
 1   Morningstar Risk                   6016 non-null   object 
 2   Morningstar Sustainability Rating  6016 non-null   object 
 3   3-year Return (%)                  6016 non-null   object 
 4   Dividend Yield (%)                 6016 non-null   object 
 5   % of Holdings in Cash              6016 non-null   float64
 6   Price/Earnings                     6016 non-null   object 
 7   Price/Cash Flow                    6016 non-null   object 
 8   Average Market Cap ($ mil)         6016 non-null   object 
 9   ROE Last Year (%)                  6016 non-null   object 
 10  Debt/Capital Last Year (%)         6016 non-null   object 
 11  No. of Holdings in Portfolio       6016 non-null   int64

### Convert data type to integer or float

In [28]:
# Target dtype for each column that should be numeric. Every column appears
# exactly once ('% Assets in Top 10 Holdings' used to be converted twice).
numeric_dtypes = {
    'Morningstar Sustainability Rating': int,
    '3-year Return (%)': float,
    'Dividend Yield (%)': float,
    'Price/Earnings': float,
    'Price/Cash Flow': float,
    'Average Market Cap ($ mil)': int,
    'ROE Last Year (%)': float,
    'Debt/Capital Last Year (%)': float,
    '% Assets in Top 10 Holdings': float,
    'Turnover Ratio (%)': int,
    'Expense Ratio (%)': float,
    'Minimum Initial Purchase ($)': int,
}

# A single astype call converts all listed columns at once; if any value cannot
# be parsed the call raises and the frame is left unconverted rather than
# half-converted.
df_mf = df_mf.astype(numeric_dtypes)

In [29]:
# Re-check the dtypes to confirm the conversions above took effect.
df_mf.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 6016 entries, 0 to 6520
Data columns (total 21 columns):
 #   Column                             Non-Null Count  Dtype  
---  ------                             --------------  -----  
 0   Ticker                             6016 non-null   object 
 1   Morningstar Risk                   6016 non-null   object 
 2   Morningstar Sustainability Rating  6016 non-null   int64  
 3   3-year Return (%)                  6016 non-null   float64
 4   Dividend Yield (%)                 6016 non-null   float64
 5   % of Holdings in Cash              6016 non-null   float64
 6   Price/Earnings                     6016 non-null   float64
 7   Price/Cash Flow                    6016 non-null   float64
 8   Average Market Cap ($ mil)         6016 non-null   int64  
 9   ROE Last Year (%)                  6016 non-null   float64
 10  Debt/Capital Last Year (%)         6016 non-null   float64
 11  No. of Holdings in Portfolio       6016 non-null   int64

In [30]:
# Preview the first rows of the converted frame.
df_mf.head()

Unnamed: 0,Ticker,Morningstar Risk,Morningstar Sustainability Rating,3-year Return (%),Dividend Yield (%),% of Holdings in Cash,Price/Earnings,Price/Cash Flow,Average Market Cap ($ mil),ROE Last Year (%),Debt/Capital Last Year (%),No. of Holdings in Portfolio,% Assets in Top 10 Holdings,Turnover Ratio (%),Average Manager Tenure (years),Expense Ratio (%),No-load Funds,Minimum Initial Purchase ($),Total Assets ($ mil),Closed to New Investors,S&P500 3-year Return (%)
0,AAAGX,Above Average,3,20.73,1.97,1.69,32.14,24.23,294701,31.56,44.55,45,55.73,58,2,1.14,No,2000,1768,No,10.3
1,AACIX,High,2,0.22,0.48,3.79,12.96,6.84,8740,2.21,48.49,124,18.37,35,6,0.95,Yes,250000,195,No,10.3
2,AADEX,Above Average,2,3.75,0.67,1.72,15.04,10.34,57742,12.54,48.12,168,21.82,67,12,0.63,Yes,250000,4242,No,10.3
3,AADGX,Below Average,3,6.39,0.66,2.62,21.85,16.11,14323,26.21,40.21,51,24.66,47,5,1.08,Yes,2500,70,No,10.3
4,AAGOX,Above Average,2,27.82,2.38,0.22,42.08,26.35,152652,21.25,36.98,59,47.3,144,19,0.89,Yes,0,446,No,10.3


### Add Outperform/Underperform column

In [31]:
# Fund return less its expense ratio, then less the benchmark return: the
# fee-adjusted gap to the S&P 500 in percentage points.
df_mf['3-year Annualized Return vs. S&P500'] = (
    df_mf['3-year Return (%)']
    .sub(df_mf['Expense Ratio (%)'])
    .sub(df_mf['S&P500 3-year Return (%)'])
)

In [32]:
# Both raw return columns are already folded into the relative-return column.
df_mf.drop(columns=['3-year Return (%)', 'S&P500 3-year Return (%)'], inplace=True)

In [33]:
def outperform(return_diff):
    """Label a fund by the sign of its return difference versus the benchmark.

    Parameters
    ----------
    return_diff : float
        Fund return minus benchmark return, in percentage points.

    Returns
    -------
    str or None
        'Outperform' when the difference is strictly positive, 'Underperform'
        when it is zero or negative (matching the benchmark is not beating it),
        and None when the difference is NaN.
    """
    if return_diff > 0:
        return 'Outperform'
    # Zero is included here so that a fund exactly matching the benchmark is
    # not silently left without a label.
    if return_diff <= 0:
        return 'Underperform'
    # Only NaN reaches this point: every comparison against NaN is False.
    return None

# Label each fund element-wise from its relative return.
df_mf['Outperform / Underperform'] = (
    df_mf['3-year Annualized Return vs. S&P500'].map(outperform)
)

In [34]:
# Preview the frame with the new relative-return and label columns.
df_mf.head()

Unnamed: 0,Ticker,Morningstar Risk,Morningstar Sustainability Rating,Dividend Yield (%),% of Holdings in Cash,Price/Earnings,Price/Cash Flow,Average Market Cap ($ mil),ROE Last Year (%),Debt/Capital Last Year (%),No. of Holdings in Portfolio,% Assets in Top 10 Holdings,Turnover Ratio (%),Average Manager Tenure (years),Expense Ratio (%),No-load Funds,Minimum Initial Purchase ($),Total Assets ($ mil),Closed to New Investors,3-year Annualized Return vs. S&P500,Outperform / Underperform
0,AAAGX,Above Average,3,1.97,1.69,32.14,24.23,294701,31.56,44.55,45,55.73,58,2,1.14,No,2000,1768,No,9.29,Outperform
1,AACIX,High,2,0.48,3.79,12.96,6.84,8740,2.21,48.49,124,18.37,35,6,0.95,Yes,250000,195,No,-11.03,Underperform
2,AADEX,Above Average,2,0.67,1.72,15.04,10.34,57742,12.54,48.12,168,21.82,67,12,0.63,Yes,250000,4242,No,-7.18,Underperform
3,AADGX,Below Average,3,0.66,2.62,21.85,16.11,14323,26.21,40.21,51,24.66,47,5,1.08,Yes,2500,70,No,-4.99,Underperform
4,AAGOX,Above Average,2,2.38,0.22,42.08,26.35,152652,21.25,36.98,59,47.3,144,19,0.89,Yes,0,446,No,16.63,Outperform


In [35]:
# Count the funds in each Outperform / Underperform class.
df_mf['Outperform / Underperform'].value_counts()

Underperform    3373
Outperform      2643
Name: Outperform / Underperform, dtype: int64

In [36]:
# Median relative return among funds with a positive difference.
beat_benchmark = df_mf['3-year Annualized Return vs. S&P500'] > 0
df_mf.loc[beat_benchmark, '3-year Annualized Return vs. S&P500'].median()

6.0

In [37]:
# Median relative return among funds with a negative difference.
trailed_benchmark = df_mf['3-year Annualized Return vs. S&P500'] < 0
df_mf.loc[trailed_benchmark, '3-year Annualized Return vs. S&P500'].median()

-5.710000000000001

In [38]:
# Encode the label as an integer: 1 = Outperform, 0 = Underperform.
binary_mapper = {'Outperform': 1, 'Underperform': 0}
# Cast explicitly instead of relying on pandas to downcast the object column
# after replace(). The cast also fails loudly if any row is still unlabeled,
# and re-running the cell on already-encoded values is a no-op.
df_mf['Outperform / Underperform'] = (
    df_mf['Outperform / Underperform'].replace(binary_mapper).astype('int64')
)

In [39]:
# Write the cleaned frame to disk in CSV format, omitting the index column.
df_mf.to_csv('../Data/US_mutual_fund_data_cleaned',index=False)