In [1]:
import sqlite3
import pandas as pd

# Location of the SQLite database file.
# NOTE(review): this is an absolute, machine-specific path; the notebook will not
# run elsewhere unless the constant is edited — consider making it configurable.
DB_PATH = '/home/orestis/code/Orestis/InvestorAPI/app/database/ibd.db'

# Load every column of `price_prediction_dataset` for rows whose
# `fiscal_date_ending` is at least three months before today, oldest first.
# Presumably the three-month cutoff keeps only rows for which the following
# quarter's price is already known — TODO confirm.
query = '''
    SELECT * 
    FROM price_prediction_dataset 
    WHERE DATE(fiscal_date_ending) <= date('now', '-3 months')
    ORDER BY DATE(fiscal_date_ending)
'''

db_conn = sqlite3.connect(DB_PATH)
try:
    stocks_df = pd.read_sql(query, db_conn)
finally:
    # Always release the connection, even when the query fails.
    db_conn.close()


In [4]:
# Bare expression: Jupyter only displays the value of a cell's last expression,
# and this one is followed by more code, so it produces no output here.
stocks_df.columns

# Columns retained from the raw dataset, grouped by origin.
# Every entry must end with a comma: Python silently concatenates adjacent
# string literals, so a missing comma merges two column names into one
# non-existent name.
columns_to_keep = [
    # Income statement
    'total_revenue',
    'gross_profit',
    'operating_income',
    'net_income',
    'ebitda',
    'net_interest_income',

    # Balance sheet
    'total_assets',
    'total_liabilities',
    'total_shareholder_equity',
    'total_current_assets',
    'total_current_liabilities',
    'cash_and_cash_equivalents_at_carrying_value',
    'long_term_debt',
    'current_net_receivables',
    'inventory',
    'property_plant_equipment',

    # Cash flow
    'operating_cashflow',
    'capital_expenditures',
    'cashflow_from_investment',
    'cashflow_from_financing',
    'dividend_payout',
    'proceeds_from_issuance_of_long_term_debt_and_capital_securities_net',
    'payments_for_repurchase_of_equity',

    # Economic indicators
    'avg_interest_rate',
    'avg_treasury_yield',
    'inflation',
    # 'gdp',  # currently excluded

    # Stock related
    'sector',
    'avg_three_months_price',
    'avg_next_three_months_price',
]

In [5]:
# Keep all rows, but only the columns listed in `columns_to_keep`.
filtered_df = stocks_df.loc[:, columns_to_keep]

In [6]:
# Names of the columns in which at least one row is exactly 0.
columns_with_zeros = filtered_df.columns[(filtered_df == 0).any(axis=0)]

# Report the finding, handling the "nothing found" case first.
if columns_with_zeros.empty:
    print("No columns have zero values.")
else:
    print(f"Columns with zero values: {columns_with_zeros}")


Columns with zero values: Index(['total_revenue', 'gross_profit', 'operating_income', 'net_income',
       'ebitda', 'net_interest_income', 'total_assets', 'total_liabilities',
       'total_shareholder_equity', 'total_current_assets',
       'total_current_liabilities',
       'cash_and_cash_equivalents_at_carrying_value', 'long_term_debt',
       'current_net_receivables', 'inventory', 'property_plant_equipment',
       'operating_cashflow', 'capital_expenditures',
       'cashflow_from_investment', 'cashflow_from_financing',
       'dividend_payout',
       'proceeds_from_issuance_of_long_term_debt_and_capital_securities_net',
       'payments_for_repurchase_of_equity'],
      dtype='object')


Income statement
Total revenue
Gross profit
Operating income
Net income
EBITDA
Net interest income

Balance sheet
Total assets
Total liabilities
Total shareholder equity
Total current assets
Total current liabilities
Cash and cash equivalents
Long term debt
Net receivables
Inventory
Property, plant and equipment (PP&E)

Cash flow
Operating cash flow
Capital expenditures
Cash flow from investing activities
Cash flow from financing activities
Dividend payout
Proceeds from Issuance of Long-Term Debt and Capital Securities Net
Payments for repurchase of equity
