In [1]:
import requests
import pandas as pd
import numpy as np

http_proxy  = "http://proxy-web.micron.com:80"
https_proxy = "http://proxy-web.micron.com:80"
proxyDict = { 
    "http":http_proxy, 
    "https":https_proxy              
}

pd.set_option('display.max_rows', None) #show every row for pandas
pd.set_option('display.max_columns', None) #show every column for pandas

g_year = 108
g_season = 1
g_how_many_year = 3

In [2]:
# sii:上市, otc:上櫃
# TWSE之數據是至該季的累計數據而非單季數據, EX: Q3=> TWSE: Q1~Q3, 財報狗:Q3
def financial_statement(year, season, stocktype, type='綜合損益彙總表'):
    if year >= 1000:
        year -= 1911
        
    if type == '綜合損益彙總表':
        url = 'https://mops.twse.com.tw/mops/web/ajax_t163sb04'
    elif type == '資產負債彙總表':
        url = 'https://mops.twse.com.tw/mops/web/ajax_t163sb05'
    elif type == '營益分析彙總表':
        url = 'https://mops.twse.com.tw/mops/web/ajax_t163sb06'
    else:
        print('type does not match')
    
    r = requests.post(url, {
        'encodeURIComponent':1,
        'step':1,
        'firstin':1,
        'off':1,
        'TYPEK':stocktype,
        'year':str(year),
        'season':str(season),
    }, stream=True)#, verify=False)#, proxies=proxyDict)
    
    r.encoding = 'utf8'
    dfs = pd.read_html(r.text)
    
    
    for i, df in enumerate(dfs):
        df.columns = df.iloc[0]
        dfs[i] = df.iloc[1:]
        
    df = pd.concat(dfs).applymap(lambda x: x if x != '--' else np.nan)
    df = df[df[u'公司代號'] != u'公司代號']
    df = df[~df[u'公司代號'].isnull()]
    
    #http://pandas.pydata.org/pandas-docs/stable/generated/pandas.DataFrame.add_suffix.html
    #http://pandas.pydata.org/pandas-docs/stable/generated/pandas.DataFrame.add_prefix.html
    suffix_format = "_{0}Q{1}".format(year, season)
    
    #return df.add_suffix(suffix_format)
    return df

In [3]:
def generate_df_for_stocktype(year, season, howmany_year_data, stocktype, title_name, with_col_name, sheettype):
    df = financial_statement(year, season, stocktype, type=sheettype)[[u'公司代號',u'公司名稱',with_col_name]]
    df.rename(columns = {df.columns[2]: '{0}_{1}Q{2}'.format(title_name, year, season)}, inplace = True)

    for i in range(howmany_year_data*4):
        # calculate previous quarter data 107Q1 => we want the previous data is 106Q4 AND then 106Q3, 106Q2, 106Q1, 105Q4
        if (season != 1):
            season = season - 1
        else:
            season = 4
            year = year - 1
        #https://pandas.pydata.org/pandas-docs/stable/generated/pandas.DataFrame.merge.html
        dfanother = financial_statement(year, season, stocktype, type=sheettype)[[u'公司代號',with_col_name]]    
        print(dfanother.columns[1])

        dfanother.rename(columns = {dfanother.columns[1]: '{0}_{1}Q{2}'.format(title_name, year, season)}, inplace = True)

        df = df.merge(dfanother, on=u'公司代號', how='inner')
        print("year:", year)
        #print("year: {0}".format(year))
        print("season:", season)
        #print("season: {0}".format(season))

    return df

In [4]:
#Accumulate quarter data
df_eps_sii = generate_df_for_stocktype(g_year, g_season, g_how_many_year, 'sii', 'EPS', u'基本每股盈餘（元）', '綜合損益彙總表')

df_eps_sii

of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.




基本每股盈餘（元）
('year:', 107)
('season:', 4)
基本每股盈餘（元）
('year:', 107)
('season:', 3)
基本每股盈餘（元）
('year:', 107)
('season:', 2)
基本每股盈餘（元）
('year:', 107)
('season:', 1)
基本每股盈餘（元）
('year:', 106)
('season:', 4)
基本每股盈餘（元）
('year:', 106)
('season:', 3)
基本每股盈餘（元）
('year:', 106)
('season:', 2)
基本每股盈餘（元）
('year:', 106)
('season:', 1)
基本每股盈餘（元）
('year:', 105)
('season:', 4)
基本每股盈餘（元）
('year:', 105)
('season:', 3)
基本每股盈餘（元）
('year:', 105)
('season:', 2)
基本每股盈餘（元）
('year:', 105)
('season:', 1)


Unnamed: 0,公司代號,公司名稱,EPS_108Q1,EPS_107Q4,EPS_107Q3,EPS_107Q2,EPS_107Q1,EPS_106Q4,EPS_106Q3,EPS_106Q2,EPS_106Q1,EPS_105Q4,EPS_105Q3,EPS_105Q2,EPS_105Q1
0,2801,彰化銀行,0.32,1.29,1.02,0.67,0.36,1.28,0.99,0.63,0.32,1.35,1.04,0.68,0.4
1,2809,京城銀行,1.6,2.51,3.19,2.04,1.13,4.89,3.74,2.4,1.08,4.17,3.12,1.92,0.96
2,2812,台中銀行,0.29,1.18,0.89,0.57,0.27,1.1,0.8,0.51,0.27,1.09,0.78,0.49,0.25
3,2820,華票,0.23,0.99,0.78,0.54,0.25,1.01,0.76,0.49,0.23,1.22,0.99,0.71,0.35
4,2834,臺灣企銀,0.34,1.19,0.94,0.64,0.3,0.82,0.76,0.51,0.25,0.87,0.67,0.46,0.24
5,2836,高銀,0.17,0.46,0.35,0.21,0.01,0.47,0.56,0.39,0.22,0.79,0.6,0.41,0.21
6,2838,聯邦銀行,0.26,1.07,0.86,0.53,0.26,1.05,0.78,0.49,0.25,1.01,0.77,0.47,0.25
7,2845,遠東商銀,0.35,1.08,0.83,0.54,0.23,0.9,0.78,0.53,0.24,1.04,0.79,0.54,0.28
8,2849,安泰銀行,0.31,1.26,0.83,0.55,0.26,1.24,0.96,0.6,0.3,0.63,0.41,0.26,0.04
9,2855,統一證券,0.67,0.87,0.88,0.75,0.08,1.88,1.28,0.8,0.54,0.62,0.78,0.23,0.15


In [5]:
#Every single quarter data

#Each Dataframe object has a member variable shape i.e. a tuple that contains dimensions of a dataframe like,
#(Number_of_index, Number_of_columns)
#idx = df_eps_sii.columns # the column index
#idx = df_eps_sii.index # the row index
numOfRows_s = df_eps_sii.shape[0] #len(df_eps_sii) #len(df_eps_sii.index)
numOfColumns_s = df_eps_sii.shape[1] #len(df_eps_sii.columns)
headNameOfColumns_s = df_eps_sii.columns

print(numOfColumns_s)
df_eps_sii

for row_index_s in range(0, numOfRows_s):
    for col_index_s in range(0, numOfColumns_s):
        #print(df_eps_sii.columns.values[col_index].find('Q1')) # index of match string
        #print("Q1" in df_eps_sii.columns.values[col_index]) # True OR False
        #How to Check if a Python String Contains Another String?
        if ("Q1" in df_eps_sii.columns.values[col_index_s]): # if (df_eps_sii.columns.values[col_index].find('Q1') > -1):
            continue
        else:
            if (u"公司代號" in df_eps_sii.columns.values[col_index_s]):
                continue
            elif (u"公司名稱" in df_eps_sii.columns.values[col_index_s]):
                continue
            elif (col_index_s == numOfColumns_s-1):
                continue
            else:
                df_eps_sii.iloc[row_index_s, col_index_s] = float(df_eps_sii.iloc[row_index_s, col_index_s]) - float(df_eps_sii.iloc[row_index_s, col_index_s+1])

df_eps_sii              

15


Unnamed: 0,公司代號,公司名稱,EPS_108Q1,EPS_107Q4,EPS_107Q3,EPS_107Q2,EPS_107Q1,EPS_106Q4,EPS_106Q3,EPS_106Q2,EPS_106Q1,EPS_105Q4,EPS_105Q3,EPS_105Q2,EPS_105Q1
0,2801,彰化銀行,0.32,0.27,0.35,0.31,0.36,0.29,0.36,0.31,0.32,0.31,0.36,0.28,0.4
1,2809,京城銀行,1.6,-0.68,1.15,0.91,1.13,1.15,1.34,1.32,1.08,1.05,1.2,0.96,0.96
2,2812,台中銀行,0.29,0.29,0.32,0.3,0.27,0.3,0.29,0.24,0.27,0.31,0.29,0.24,0.25
3,2820,華票,0.23,0.21,0.24,0.29,0.25,0.25,0.27,0.26,0.23,0.23,0.28,0.36,0.35
4,2834,臺灣企銀,0.34,0.25,0.3,0.34,0.3,0.06,0.25,0.26,0.25,0.2,0.21,0.22,0.24
5,2836,高銀,0.17,0.11,0.14,0.2,0.01,-0.09,0.17,0.17,0.22,0.19,0.19,0.2,0.21
6,2838,聯邦銀行,0.26,0.21,0.33,0.27,0.26,0.27,0.29,0.24,0.25,0.24,0.3,0.22,0.25
7,2845,遠東商銀,0.35,0.25,0.29,0.31,0.23,0.12,0.25,0.29,0.24,0.25,0.25,0.26,0.28
8,2849,安泰銀行,0.31,0.43,0.28,0.29,0.26,0.28,0.36,0.3,0.3,0.22,0.15,0.22,0.04
9,2855,統一證券,0.67,-0.01,0.13,0.67,0.08,0.6,0.48,0.26,0.54,-0.16,0.55,0.08,0.15


In [6]:
#Accumulate quarter data
df_eps_otc = generate_df_for_stocktype(g_year, g_season, g_how_many_year, 'otc', 'EPS', u'基本每股盈餘（元）', '綜合損益彙總表')

df_eps_otc

of pandas will change to not sort by default.

To accept the future behavior, pass 'sort=False'.




基本每股盈餘（元）
('year:', 107)
('season:', 4)
基本每股盈餘（元）
('year:', 107)
('season:', 3)
基本每股盈餘（元）
('year:', 107)
('season:', 2)
基本每股盈餘（元）
('year:', 107)
('season:', 1)
基本每股盈餘（元）
('year:', 106)
('season:', 4)
基本每股盈餘（元）
('year:', 106)
('season:', 3)
基本每股盈餘（元）
('year:', 106)
('season:', 2)
基本每股盈餘（元）
('year:', 106)
('season:', 1)
基本每股盈餘（元）
('year:', 105)
('season:', 4)
基本每股盈餘（元）
('year:', 105)
('season:', 3)
基本每股盈餘（元）
('year:', 105)
('season:', 2)
基本每股盈餘（元）
('year:', 105)
('season:', 1)


Unnamed: 0,公司代號,公司名稱,EPS_108Q1,EPS_107Q4,EPS_107Q3,EPS_107Q2,EPS_107Q1,EPS_106Q4,EPS_106Q3,EPS_106Q2,EPS_106Q1,EPS_105Q4,EPS_105Q3,EPS_105Q2,EPS_105Q1
0,6015,宏遠證券,0.29,-1.2,-0.72,0.07,-0.08,0.57,0.51,0.1,0.06,-0.4,-0.2,-0.18,-0.01
1,6016,康和證券,0.09,-0.45,-0.23,-0.08,-0.26,1.15,0.76,0.13,0.2,-0.57,-0.21,-0.29,0.08
2,6020,大展證,0.25,0.01,0.12,0.3,-0.03,0.95,0.86,0.38,0.36,0.08,0.17,0.01,0.11
3,6021,大慶證,0.0,0.64,0.69,0.36,0.13,0.55,0.47,0.29,0.16,-0.18,-0.15,-0.24,-0.12
4,6023,元大期貨,1.09,4.31,2.95,1.86,0.89,3.76,2.64,1.48,0.7,3.6,2.68,1.91,0.9
5,6026,福邦證券,0.39,0.15,0.46,0.46,0.34,2.0,1.52,0.99,0.43,0.5,0.55,0.16,0.2
6,1258,其祥-KY,-0.4,-4.05,-3.18,0.22,0.17,1.26,1.46,1.25,0.74,3.83,3.43,2.13,1.18
7,1259,安心,0.87,4.36,3.66,2.05,0.8,5.23,4.5,2.73,1.2,5.37,4.75,3.04,1.02
8,1264,德麥,3.2,13.27,10.0,6.32,2.85,13.41,10.02,6.6,3.64,14.54,10.38,6.84,3.39
9,1333,恩得利,-0.33,-1.44,-1.31,-1.81,-0.91,-1.93,-1.47,-0.89,-0.28,-0.76,-0.51,-0.28,-0.21


In [7]:
#Every single quarter data

#Each Dataframe object has a member variable shape i.e. a tuple that contains dimensions of a dataframe like,
#(Number_of_index, Number_of_columns)
#idx = df_eps_otc.columns # the column index
#idx = df_eps_otc.index # the row index
numOfRows_o = df_eps_otc.shape[0] #len(df_eps_otc) #len(df_eps_otc.index)
numOfColumns_o = df_eps_otc.shape[1] #len(df_eps_otc.columns)
headNameOfColumns_o = df_eps_otc.columns

print(numOfColumns_o)
df_eps_otc

for row_index_o in range(0, numOfRows_o):
    for col_index_o in range(0, numOfColumns_o):
        #print(df_eps_otc.columns.values[col_index].find('Q1')) # index of match string
        #print("Q1" in df_eps_otc.columns.values[col_index]) # True OR False
        #How to Check if a Python String Contains Another String?
        if ("Q1" in df_eps_otc.columns.values[col_index_o]): # if (df_eps_otc.columns.values[col_index].find('Q1') > -1):
            continue
        else:
            if (u"公司代號" in df_eps_otc.columns.values[col_index_o]):
                continue
            elif (u"公司名稱" in df_eps_otc.columns.values[col_index_o]):
                continue
            elif (col_index_o == numOfColumns_o-1):
                continue
            else:
                df_eps_otc.iloc[row_index_o, col_index_o] = float(df_eps_otc.iloc[row_index_o, col_index_o]) - float(df_eps_otc.iloc[row_index_o, col_index_o+1])

df_eps_otc              

15


Unnamed: 0,公司代號,公司名稱,EPS_108Q1,EPS_107Q4,EPS_107Q3,EPS_107Q2,EPS_107Q1,EPS_106Q4,EPS_106Q3,EPS_106Q2,EPS_106Q1,EPS_105Q4,EPS_105Q3,EPS_105Q2,EPS_105Q1
0,6015,宏遠證券,0.29,-0.48,-0.79,0.15,-0.08,0.06,0.41,0.04,0.06,-0.2,-0.02,-0.17,-0.01
1,6016,康和證券,0.09,-0.22,-0.15,0.18,-0.26,0.39,0.63,-0.07,0.2,-0.36,0.08,-0.37,0.08
2,6020,大展證,0.25,-0.11,-0.18,0.33,-0.03,0.09,0.48,0.02,0.36,-0.09,0.16,-0.1,0.11
3,6021,大慶證,0.0,-0.05,0.33,0.23,0.13,0.08,0.18,0.13,0.16,-0.03,0.09,-0.12,-0.12
4,6023,元大期貨,1.09,1.36,1.09,0.97,0.89,1.12,1.16,0.78,0.7,0.92,0.77,1.01,0.9
5,6026,福邦證券,0.39,-0.31,0.0,0.12,0.34,0.48,0.53,0.56,0.43,-0.05,0.39,-0.04,0.2
6,1258,其祥-KY,-0.4,-0.87,-3.4,0.05,0.17,-0.2,0.21,0.51,0.74,0.4,1.3,0.95,1.18
7,1259,安心,0.87,0.7,1.61,1.25,0.8,0.73,1.77,1.53,1.2,0.62,1.71,2.02,1.02
8,1264,德麥,3.2,3.27,3.68,3.47,2.85,3.39,3.42,2.96,3.64,4.16,3.54,3.45,3.39
9,1333,恩得利,-0.33,-0.13,0.5,-0.9,-0.91,-0.46,-0.58,-0.61,-0.28,-0.25,-0.23,-0.07,-0.21


In [8]:
#Database-style DataFrame joining/merging: join, merge
#Concatenating objects: concat, append

#ignore_index = True 可以忽略合併時舊的 index 欄位，改採用自動產生的 index
df_eps = pd.concat([df_eps_sii,df_eps_otc],axis=0, ignore_index=True)

df_eps

Unnamed: 0,公司代號,公司名稱,EPS_108Q1,EPS_107Q4,EPS_107Q3,EPS_107Q2,EPS_107Q1,EPS_106Q4,EPS_106Q3,EPS_106Q2,EPS_106Q1,EPS_105Q4,EPS_105Q3,EPS_105Q2,EPS_105Q1
0,2801,彰化銀行,0.32,0.27,0.35,0.31,0.36,0.29,0.36,0.31,0.32,0.31,0.36,0.28,0.4
1,2809,京城銀行,1.6,-0.68,1.15,0.91,1.13,1.15,1.34,1.32,1.08,1.05,1.2,0.96,0.96
2,2812,台中銀行,0.29,0.29,0.32,0.3,0.27,0.3,0.29,0.24,0.27,0.31,0.29,0.24,0.25
3,2820,華票,0.23,0.21,0.24,0.29,0.25,0.25,0.27,0.26,0.23,0.23,0.28,0.36,0.35
4,2834,臺灣企銀,0.34,0.25,0.3,0.34,0.3,0.06,0.25,0.26,0.25,0.2,0.21,0.22,0.24
5,2836,高銀,0.17,0.11,0.14,0.2,0.01,-0.09,0.17,0.17,0.22,0.19,0.19,0.2,0.21
6,2838,聯邦銀行,0.26,0.21,0.33,0.27,0.26,0.27,0.29,0.24,0.25,0.24,0.3,0.22,0.25
7,2845,遠東商銀,0.35,0.25,0.29,0.31,0.23,0.12,0.25,0.29,0.24,0.25,0.25,0.26,0.28
8,2849,安泰銀行,0.31,0.43,0.28,0.29,0.26,0.28,0.36,0.3,0.3,0.22,0.15,0.22,0.04
9,2855,統一證券,0.67,-0.01,0.13,0.67,0.08,0.6,0.48,0.26,0.54,-0.16,0.55,0.08,0.15


In [9]:
#檢查column資料型態

#df_eps.info() #non-null object
#df_eps.dtypes #object
#df_eps.applymap(np.isreal) #all False
'''
公司代號              int64
公司名稱             object
EPS(%)_107Q1    float64
EPS(%)_106Q4    float64
EPS(%)_106Q3    float64
EPS(%)_106Q2    float64
EPS(%)_106Q1    float64
EPS(%)_105Q4    float64
EPS(%)_105Q3    float64
EPS(%)_105Q2    float64
EPS(%)_105Q1    float64
EPS(%)_104Q4    float64
EPS(%)_104Q3    float64
EPS(%)_104Q2    float64
EPS(%)_104Q1    float64
dtype: object
'''

df_eps = df_eps.convert_objects(convert_numeric=True) #轉成float型態方便後續處理

df_eps.convert_objects(convert_numeric=True).dtypes #轉成float型態方便後續處理

For all other conversions use the data-type specific converters pd.to_datetime, pd.to_timedelta and pd.to_numeric.
For all other conversions use the data-type specific converters pd.to_datetime, pd.to_timedelta and pd.to_numeric.


公司代號           int64
公司名稱          object
EPS_108Q1    float64
EPS_107Q4    float64
EPS_107Q3    float64
EPS_107Q2    float64
EPS_107Q1    float64
EPS_106Q4    float64
EPS_106Q3    float64
EPS_106Q2    float64
EPS_106Q1    float64
EPS_105Q4    float64
EPS_105Q3    float64
EPS_105Q2    float64
EPS_105Q1    float64
dtype: object

In [10]:
def isFloat(element):  
    try:
        float(element)
        return True
    except ValueError:
        return False

In [11]:
def growth_func(row, year, season):
    previous_year = year - 1
    #判斷是否為文字而非數字
    if(isFloat(row['EPS_{0}Q{1}'.format(year, season)]) == True):
        subsequent_value = float(row['EPS_{0}Q{1}'.format(year, season)])
        previous_value = float(row['EPS_{0}Q{1}'.format(previous_year, season)])
   
        if(previous_value == 0):
            result = ((subsequent_value - previous_value)/np.abs(subsequent_value))*100
        else:
            result = ((subsequent_value - previous_value)/np.abs(previous_value))*100            
        return float("{0:.2f}".format(result)) # Limiting floats to two decimal points
     
    else:
        return 'NoValue'

In [12]:
def ma2q_growth_func(row, year, season):
    #判斷是否為文字而非數字
    if(isFloat(row['EPS_{0}Q{1}'.format(year, season)]) == True):
        previous_value = float(row['Growth_{0}Q{1}'.format(year, season)])
        if (season != 1):
            season = season - 1
        else:
            season = 4
            year = year - 1
        subsequent_value = float(row['Growth_{0}Q{1}'.format(year, season)])
        
        result = ((subsequent_value + previous_value)/2)
        return float("{0:.2f}".format(result)) # Limiting floats to two decimal points
    
    else:
        return 'NoValue'

In [13]:
# use the apply function in pandas to apply the function
# Note the axis=1 specifier, that means that the application is done at a row, rather than a column level
# df_eps.apply (lambda row: growth_func (row),axis=1)

year = g_year
season = g_season
howmany_year_data = g_how_many_year

#first 4 quarter don't need to be calculated growth
for i in range(int(howmany_year_data*4-4)):
    df_eps['Growth_{0}Q{1}'.format(year, season)] = df_eps.apply (lambda row: growth_func(row, year, season),axis=1)
    if (season != 1):
        season = season - 1
    else:
        season = 4
        year = year - 1

  if __name__ == '__main__':


In [14]:
# use the apply function in pandas to apply the function
# Note the axis=1 specifier, that means that the application is done at a row, rather than a column level
# df_eps.apply (lambda row: growth_func (row),axis=1)

year = g_year
season = g_season
howmany_year_data = g_how_many_year

#first 4 quarter don't need to be calculated growth
for i in range(int(howmany_year_data*4-4-1)):
    df_eps['2QMAGrowth_{0}Q{1}'.format(year, season)] = df_eps.apply (lambda row: ma2q_growth_func(row, year, season),axis=1)
    if (season != 1):
        season = season - 1
    else:
        season = 4
        year = year - 1

In [15]:
def get_basic_info_for_ftock(stocktype):

    #get basic info of company
    '''
    抓取上市櫃股票的代號、名稱...等資料。
    上市
    http://isin.twse.com.tw/isin/C_public.jsp?strMode=2
    上櫃
    http://isin.twse.com.tw/isin/C_public.jsp?strMode=4
    '''
    #http://bloggerkaiweng.blogspot.com/2016/09/python.html

    if(stocktype == 'sii'):
        url='http://isin.twse.com.tw/isin/C_public.jsp?strMode=2'
    else:
        url='http://isin.twse.com.tw/isin/C_public.jsp?strMode=4'
    
    r = requests.get(url, stream=True)#, verify=False, proxies=proxyDict)
    r.encoding = 'big5hkscs'
    dfshow = pd.read_html(r.text, header=None)

    for i, df in enumerate(dfshow):
        df.columns = df.iloc[0]
        dfshow[i] = df.iloc[1:]

    df = pd.concat(dfshow).applymap(lambda x: x if x != '--' else np.nan)
    df = df[df[u'有價證券代號及名稱'] != u'股票']
    df = df[~df[u'有價證券代號及名稱'].isnull()]
    df = df.reset_index(drop=True)
    
    newdf=df[df[u'產業別'] > '0']
    del newdf[u'國際證券辨識號碼(ISIN Code)'],newdf['CFICode'],newdf[u'備註']

    df2=newdf[u'有價證券代號及名稱'].str.split(u' ', expand=True)
    df2 = df2.reset_index(drop=True)
    newdf = newdf.reset_index(drop=True)
    for i in df2.index:
        if u'　' in df2.iat[i,0]:
            df2.iat[i,1]=df2.iat[i,0].split(u'　')[1]
            df2.iat[i,0]=df2.iat[i,0].split(u'　')[0]
    newdf=df2.join(newdf)
    newdf=newdf.rename(columns = {0:u'公司代號',1:u'股票名稱'})
    del newdf[u'有價證券代號及名稱']

    return newdf

In [16]:
df_basicinfo_sii = get_basic_info_for_ftock('sii').convert_objects(convert_numeric=True) #轉成float型態
df_basicinfo_otc = get_basic_info_for_ftock('otc').convert_objects(convert_numeric=True) #轉成float型態

df_basicinfo = pd.concat([df_basicinfo_sii,df_basicinfo_otc],axis=0, ignore_index=True)
#df_eps_basicinfo_sii.dtypes
#df_eps_basicinfo_otc

df_eps = df_eps.merge(df_basicinfo, on=u'公司代號', how='inner')

df_eps

For all other conversions use the data-type specific converters pd.to_datetime, pd.to_timedelta and pd.to_numeric.
  """Entry point for launching an IPython kernel.
For all other conversions use the data-type specific converters pd.to_datetime, pd.to_timedelta and pd.to_numeric.
  


Unnamed: 0,公司代號,公司名稱,EPS_108Q1,EPS_107Q4,EPS_107Q3,EPS_107Q2,EPS_107Q1,EPS_106Q4,EPS_106Q3,EPS_106Q2,EPS_106Q1,EPS_105Q4,EPS_105Q3,EPS_105Q2,EPS_105Q1,Growth_108Q1,Growth_107Q4,Growth_107Q3,Growth_107Q2,Growth_107Q1,Growth_106Q4,Growth_106Q3,Growth_106Q2,2QMAGrowth_108Q1,2QMAGrowth_107Q4,2QMAGrowth_107Q3,2QMAGrowth_107Q2,2QMAGrowth_107Q1,2QMAGrowth_106Q4,2QMAGrowth_106Q3,股票名稱,上市日,市場別,產業別
0,2801,彰化銀行,0.32,0.27,0.35,0.31,0.36,0.29,0.36,0.31,0.32,0.31,0.36,0.28,0.4,-11.11,-6.9,-2.78,0.0,12.5,-6.45,0.0,10.71,-9.0,-4.84,-1.39,6.25,3.02,-3.23,5.36,彰銀,1962/02/15,上市,金融保險業
1,2809,京城銀行,1.6,-0.68,1.15,0.91,1.13,1.15,1.34,1.32,1.08,1.05,1.2,0.96,0.96,41.59,-159.13,-14.18,-31.06,4.63,9.52,11.67,37.5,-58.77,-86.66,-22.62,-13.21,7.07,10.59,24.59,京城銀,1983/07/20,上市,金融保險業
2,2812,台中銀行,0.29,0.29,0.32,0.3,0.27,0.3,0.29,0.24,0.27,0.31,0.29,0.24,0.25,7.41,-3.33,10.34,25.0,0.0,-3.23,0.0,0.0,2.04,3.5,17.67,12.5,-1.61,-1.61,0.0,台中銀,1984/05/15,上市,金融保險業
3,2820,華票,0.23,0.21,0.24,0.29,0.25,0.25,0.27,0.26,0.23,0.23,0.28,0.36,0.35,-8.0,-16.0,-11.11,11.54,8.7,8.7,-3.57,-27.78,-12.0,-13.55,0.21,10.12,8.7,2.56,-15.68,華票,1994/10/26,上市,金融保險業
4,2834,臺灣企銀,0.34,0.25,0.3,0.34,0.3,0.06,0.25,0.26,0.25,0.2,0.21,0.22,0.24,13.33,316.67,20.0,30.77,20.0,-70.0,19.05,18.18,165.0,168.34,25.38,25.38,-25.0,-25.48,18.62,臺企銀,1998/01/03,上市,金融保險業
5,2836,高銀,0.17,0.11,0.14,0.2,0.01,-0.09,0.17,0.17,0.22,0.19,0.19,0.2,0.21,1600.0,222.22,-17.65,17.65,-95.45,-147.37,-10.53,-15.0,911.11,102.28,0.0,-38.9,-121.41,-78.95,-12.77,高雄銀,1998/05/18,上市,金融保險業
6,2838,聯邦銀行,0.26,0.21,0.33,0.27,0.26,0.27,0.29,0.24,0.25,0.24,0.3,0.22,0.25,0.0,-22.22,13.79,12.5,4.0,12.5,-3.33,9.09,-11.11,-4.21,13.14,8.25,8.25,4.58,2.88,聯邦銀,1998/06/29,上市,金融保險業
7,2845,遠東商銀,0.35,0.25,0.29,0.31,0.23,0.12,0.25,0.29,0.24,0.25,0.25,0.26,0.28,52.17,108.33,16.0,6.9,-4.17,-52.0,0.0,11.54,80.25,62.16,11.45,1.37,-28.09,-26.0,5.77,遠東銀,1998/11/27,上市,金融保險業
8,2849,安泰銀行,0.31,0.43,0.28,0.29,0.26,0.28,0.36,0.3,0.3,0.22,0.15,0.22,0.04,19.23,53.57,-22.22,-3.33,-13.33,27.27,140.0,36.36,36.4,15.68,-12.77,-8.33,6.97,83.64,88.18,安泰銀,1999/09/27,上市,金融保險業
9,2855,統一證券,0.67,-0.01,0.13,0.67,0.08,0.6,0.48,0.26,0.54,-0.16,0.55,0.08,0.15,737.5,-101.67,-72.92,157.69,-85.19,475.0,-12.73,225.0,317.92,-87.3,42.38,36.25,194.91,231.13,106.14,統一證,2002/09/16,上市,金融保險業


In [17]:
# pandas styling
def color_white(val):
    """
    Takes a scalar and returns a string with
    the css property `'color: red'` for negative
    strings, black otherwise.
    """
    color = 'white'
    return 'color: %s' % color

def background_color(val):    
    if float(val) < 0:
        backgroundcolor = '#ff0000'
    elif float(val) < 10:
        backgroundcolor = '#f47721'
    elif float(val) < 20:
        backgroundcolor = '#ffdd00'
    elif float(val) < 30:
        backgroundcolor = '#5ecc62'
    else:
        backgroundcolor = '#00ad45'
    return 'background-color: %s' % backgroundcolor

"""
Export to Excel
Some support is available for exporting styled DataFrames to Excel worksheets using the OpenPyXL or XlsxWriter engines. 
CSS2.2 properties handled include:

* background-color
* border-style, border-width, border-color and their {top, right, bottom, left variants}
* color
* font-family
* font-style
* font-weight
* text-align
* text-decoration
* vertical-align
* white-space: nowrap
"""
def font_family(val):    
    fontfamily = 'Calibri'
    return 'font-family: %s' % fontfamily

def font_size(val):    
    fontsize = '10pt'
    return 'font-size: %s' % fontsize

In [18]:
# styled dataframe can use .to_excel('Styled_Basic_EPS.xlsx', engine='openpyxl') to export excel with style
year = g_year
season = g_season
howmany_year_data = g_how_many_year

#first 4 quarter don't need to be calculated growth
columns_name = []
for i in range(int(howmany_year_data*4-4)):
    columns_name.append('Growth_{0}Q{1}'.format(year, season))
    columns_name.append('2QMAGrowth_{0}Q{1}'.format(year, season))
    if (season != 1):
        season = season - 1
    else:
        season = 4
        year = year - 1

print(columns_name)
# the cell’s style depends only on it’s own value. That means we should use the Styler.applymap method which works elementwise.
# Now suppose you wanted to highlight the maximum value in each column. We can’t use .applymap anymore since that operated elementwise. Instead, we’ll turn to .apply which operates columnwise (or rowwise using the axis keyword).
#df_eps.style.applymap(color_negative_red, subset=pd.IndexSlice[:, ['Growth_107Q1','Growth_106Q4','Growth_106Q3','Growth_106Q2','Growth_106Q1','Growth_105Q4','Growth_105Q3','Growth_105Q2']]).applymap(background_color, subset=pd.IndexSlice[:, ['Growth_107Q1','Growth_106Q4','Growth_106Q3','Growth_106Q2','Growth_106Q1','Growth_105Q4','Growth_105Q3','Growth_105Q2']]).to_excel('Styled_Basic_EPS.xlsx', 'EPS_Basic', engine='openpyxl')
df_eps.style.applymap(color_white, subset=pd.IndexSlice[:, columns_name]).applymap(background_color, subset=pd.IndexSlice[:, columns_name]).applymap(font_family).applymap(font_size).to_excel('Styled_Basic_Perspective_EPS.xlsx', 'EPS_Basic', engine='openpyxl')

# Pandas style function to hignlight specific columns
# http://pandas.pydata.org/pandas-docs/stable/style.html#Finer-Control:-Slicing
# Finer Control: Slicing
# ex: df.style.apply(highlight_max, subset=['B', 'C', 'D'])

['Growth_108Q1', '2QMAGrowth_108Q1', 'Growth_107Q4', '2QMAGrowth_107Q4', 'Growth_107Q3', '2QMAGrowth_107Q3', 'Growth_107Q2', '2QMAGrowth_107Q2', 'Growth_107Q1', '2QMAGrowth_107Q1', 'Growth_106Q4', '2QMAGrowth_106Q4', 'Growth_106Q3', '2QMAGrowth_106Q3', 'Growth_106Q2', '2QMAGrowth_106Q2']


Passing list-likes to .loc or [] with any missing label will raise
KeyError in the future, you can use .reindex() as an alternative.

See the documentation here:
https://pandas.pydata.org/pandas-docs/stable/indexing.html#deprecate-loc-reindex-listlike
  return self._getitem_tuple(key)
