# Retreiving and Preparing Stock's Income Statement Information
This section of the code will concentrate on extracting stock's income statement information from IEX Cloud API. At the end, this section of the code will provide a complete and formatted income statement dataset.  

## Importing neccessary modules

In [16]:
import pandas as pd
import numpy as np
import requests
from datetime import date, datetime
from dateutil.relativedelta import relativedelta
import xlsxwriter

## Setting up base URL

Fetching the fundamentals and finacial data about the stock from ther IEX Cloud endpoints.

In [17]:
from api_secret import IEX_CLOUD_API_TOKEN

symbol = input("Enther the ticker here: ")

# API endpoints to collect stock data
income_endpoint = f'https://sandbox.iexapis.com/stable/stock/{symbol}/income?period=quarter&last=12&token={IEX_CLOUD_API_TOKEN}'
financials_endpoint = f'https://sandbox.iexapis.com/stable/stock/{symbol}/financials?period=quarter&last=12&token={IEX_CLOUD_API_TOKEN}'
fundamentals_endpoint = f'https://sandbox.iexapis.com/stable/stock/{symbol}/fundamentals?period=quarter&last=12&token={IEX_CLOUD_API_TOKEN}'

income_endpoint_data = requests.get(income_endpoint).json()
financials_endpoint_data = requests.get(financials_endpoint).json()
fundamentals_endpoint_data = requests.get(fundamentals_endpoint).json()

## Extracting the data
This part will concentrate on extracting the data that will form the final income statement for the stock.

### Forming the Dataset columns
The columns will be comprised of the Pandas DatetimeIndex. It will be created based on the quarters (reportDate) of the reported stock data.


First step is to find the quarters of the reported stock data.

In [18]:
reportDate_list = []
quarter_list = []

# Converting string date into the date object
for stock_data in income_endpoint_data['income']:
    converted_date = datetime.strptime(stock_data['reportDate'], '%Y-%m-%d').date()
    reportDate_list.append(converted_date)


# function to determine to which quarter the reported stock data
# is referred to
def quarter_finder(dates_list):
    global quarter_list

    for d in reportDate_list:
        q1 = date(d.year, 3, 31)
        q2 = date(d.year, 6, 30)
        q3 = date(d.year, 9, 30)
        q4 = date(d.year, 12, 31)

        if d < q1:
            q = date(d.year - relativedelta(year=1).year, 12, 31)
        if d > q1 and d < q2:
            q = date(d.year, 3, 30)
        if d > q2 and d < q3:
            q = date(d.year, 6, 30)
        if d > q3 and d < q4:
            q = date(d.year, 9, 30)
        
        quarter_list.append(q)

quarter_finder(reportDate_list)

The above created Datetime-like array will serve as an input to Pandas' DatetimeIndex objet (columns of the future dataset)

In [19]:
columns = pd.DatetimeIndex(data=quarter_list)

The next step is the creation of the actual DataFrame.

In [20]:
index = [
    'Total Revenue',
    'Total Revenue (Growth)',
    'Cost of Revenue',
    'Cost of Revenue (Growth)',
    'Gross Profit',
    'Gross Profit (Growth)',
    'Operating Expense',
    'SG&A',
    'SG&A (Growth)',
    'Research and Development',
    'Operating Income',
    'Pretax Income',
    'Pretax Income (Growth)',
    'Tax Provision',
    'Net Income',
    'Net Income (Growth)',
    'Basic EPS',
    'Basic EPS (Growth)',
    'Diluted EPS',
    'Total Expenses',
    'Total Expenses (Growth)',
    'Interest Income',
    'Inerest Income (Growth)',
    'Interest Expense',
    'Interest Expense (Growth)',
    'EBIT',
    'EBITDA',
    'EBITDA (Growth)'
]

income_statement = pd.DataFrame(columns=columns, index=index, data=None)

### Filling the dataframe with data returned by API endpoints.

The first API endpoint to get the stock data from is the 'financials' endpoint.

In [21]:
financials_dict = {
    'Total Revenue': [],
    'Operating Income': [],
    'Pretax Income': [],
    'Tax Provision': [],
    'Net Income': [],
    'Total Expenses': [],
    'Interest Income': [],
    'EBIT': [],
    'EBITDA': []
}


# Filling the financials_dict dictionary with data collected
# from the API endpoint
for quarter_data in financials_endpoint_data['financials']:
    financials_dict['Total Revenue'].append(quarter_data['totalRevenue'])
    financials_dict['Operating Income'].append(quarter_data['operatingIncome'])
    financials_dict['Pretax Income'].append(quarter_data['pretaxIncome'])
    financials_dict['Tax Provision'].append(quarter_data['incomeTax'])
    financials_dict['Net Income'].append(quarter_data['netIncome'])
    financials_dict['Total Expenses'].append(quarter_data['operatingExpense'])
    financials_dict['Interest Income'].append(quarter_data['interestIncome'])
    financials_dict['EBIT'].append(quarter_data['ebit'])
    financials_dict['EBITDA'].append(quarter_data['EBITDA'])


# Putting the data into the DataFrame
for stock_attribute in financials_dict:
    for row in income_statement.index:
        if row == stock_attribute:
            income_statement.loc[row] = financials_dict[stock_attribute]


The second is the income API endpoint.

In [22]:
income_dict = {
    'Cost of Revenue': [],
    'Gross Profit': [],
    'Operating Expense': [],
    'SG&A': [],
    'Research and Development': []
}

for quarter_data in income_endpoint_data['income']:
    income_dict['Cost of Revenue'].append(quarter_data['costOfRevenue'])
    income_dict['Gross Profit'].append(quarter_data['grossProfit'])
    income_dict['Operating Expense'].append(quarter_data['operatingExpense'])
    income_dict['SG&A'].append(quarter_data['sellingGeneralAndAdmin'])
    income_dict['Research and Development'].append(quarter_data['researchAndDevelopment'])

for stock_attribute in income_dict:
    for row in income_statement.index:
        if row == stock_attribute:
            income_statement.loc[row] = income_dict[stock_attribute]

The final endpoint to use the data from in the dataset is the fundamentals endpoint.

In [23]:
fundamentals_dict = {
    'Basic EPS': [],
    'Diluted EPS': [],
    'Interest Expense': []
}

for quarter_data in fundamentals_endpoint_data['fundamentals']:
    fundamentals_dict['Basic EPS'].append(quarter_data['incomeNetPerWabsoSplitAdjusted'])
    fundamentals_dict['Diluted EPS'].append(quarter_data['incomeNetPerWadsoSplitAdjusted'])
    fundamentals_dict['Interest Expense'].append(quarter_data['expensesInterest'])

for stock_attribute in fundamentals_dict:
    for row in income_statement.index:
        if row == stock_attribute:
            income_statement.loc[row] = fundamentals_dict[stock_attribute]

## Calculating the Growth

Below section deals with the 'Growth' columns to give an investor an advantage of company's success metric.

In [82]:
# Calculating the growth rate based on the stock metrics' 
for df_index, row_name in enumerate(income_statement.index):
    if 'Growth' in row_name:
        for row_index, value in enumerate(income_statement.iloc[df_index - 1]):
            try:
                growth_rate = (value / income_statement.iloc[df_index - 1, row_index + 1]) * 100
                income_statement.iloc[df_index, row_index] = (growth_rate - 100) / 100
            except IndexError:
                break

income_statement

Unnamed: 0,2022-09-30,2022-06-30,2022-03-30,2021-12-31,2021-09-30,2021-06-30,2021-03-30,2020-12-31,2020-09-30,2020-06-30,2020-03-30,2019-12-31
Total Revenue,1200384000.0,1051042000.0,990269600.0,1008282000.0,868637800.0,839340400.0,736265700.0,773230200.0,682336400.0,615686800.0,590266000.0,631836664.0
Total Revenue (Growth),0.1420893,0.06136979,-0.01786398,0.1607617,0.03490529,0.1399966,-0.04780525,0.1332096,0.1082526,0.04306652,-0.0657933,
Cost of Revenue,292115500.0,261064600.0,256682900.0,234959100.0,213374200.0,195547400.0,162131100.0,170921000.0,140970600.0,140519600.0,132319600.0,140963949.0
Cost of Revenue (Growth),0.1189395,0.01707037,0.09245779,0.1011599,0.0911636,0.2061064,-0.05142656,0.2124588,0.003209017,0.06197126,-0.06132286,
Gross Profit,876215900.0,811896400.0,708894100.0,769795700.0,678820700.0,633848300.0,559424600.0,603969600.0,512455500.0,495893900.0,453009800.0,480269456.0
Gross Profit (Growth),0.07922122,0.1453,-0.07911395,0.1340192,0.07095138,0.1330361,-0.07375368,0.1785797,0.03339729,0.09466503,-0.05675917,
Operating Expense,919103600.0,837678900.0,820849700.0,754772200.0,717770100.0,677686400.0,591727500.0,588582300.0,546045200.0,519943000.0,508516400.0,517703188.0
SG&A,483892200.0,472134600.0,436931500.0,417287700.0,401858500.0,372403300.0,345335900.0,330328700.0,306340000.0,293036900.0,302341100.0,298137836.0
SG&A (Growth),0.02490305,0.08056908,0.04707491,0.03839464,0.07909494,0.07837994,0.04543088,0.0783075,0.04539748,-0.0307739,0.01409834,
Research and Development,135600500.0,126982100.0,131040600.0,114566400.0,110588700.0,108326700.0,99816790.0,90760800.0,90865130.0,84755040.0,83820620.0,74721417.0


Dealing with NaN values.

In [1]:
income_statement.fillna(value='', inplace=True)

NameError: name 'income_statement' is not defined