In [5]:
import sys
import os
# Make the parent of the current working directory importable (presumably the
# project root that holds the `data`, `config`, `modeling` and `observability`
# packages imported by this notebook -- confirm against the repo layout).
# The membership check keeps the cell idempotent: re-running it no longer
# appends a duplicate entry to sys.path on every execution.
PROJECT_ROOT = os.path.abspath(os.path.join(os.getcwd(), '..'))
if PROJECT_ROOT not in sys.path:
    sys.path.append(PROJECT_ROOT)

import pandas as pd
from datetime import datetime, timezone
import logging

logging.basicConfig(
    level=logging.INFO,  # Set the logging level
    format='%(asctime)s - %(levelname)s - %(message)s',  # Format for the log messages
    handlers=[
        logging.StreamHandler()  # Log to the console
    ]
)

# Load (or reload) IPython's autoreload extension and switch it to mode 2 so
# edits to the project modules imported below are picked up without
# restarting the kernel.
%reload_ext autoreload
%autoreload 2
from data.raw.retrievers.alpaca_markets_retriever import AlpacaMarketsRetriever
from config.constants import *
from data.processed.dataset_creation import DatasetCreator
from data.processed.indicators import *
from data.processed.targets import Balanced3ClassClassification
from data.processed.normalization import ZScoreOverWindowNormalizer, ZScoreNormalizer, MinMaxNormalizer
from data.processed.missing_values_handling import DummyMissingValuesHandler
from data.processed.dataset_pytorch import DatasetPytorch
from modeling.trainer import Trainer
from observability.mlflow_integration import log_experiment

from config.experiments.cur_experiment import config

  from .autonotebook import tqdm as notebook_tqdm


In [12]:
# Fetch bars for TSLA over the date range defined by the experiment config.
retriever = AlpacaMarketsRetriever()

retrieval_result = retriever.bars(
    symbol_or_symbols='TSLA',
    start=config.data_config.start,
    end=config.data_config.end,
)

In [13]:
# Assemble the dataset pipeline from the experiment configuration. Every
# DatasetCreator keyword argument is named after the `config.data_config`
# attribute that supplies it, so the arguments are gathered by name.
dataset_creator = DatasetCreator(**{
    option: getattr(config.data_config, option)
    for option in (
        'features',
        'target',
        'normalizer',
        'missing_values_handler',
        'train_set_last_date',
        'in_seq_len',
        'multi_asset_prediction',
    )
})

# Run the pipeline on the retrieved bars. In this notebook the result is
# indexed by ticker symbol (e.g. features['TSLA']).
features = dataset_creator.create_dataset_numpy(retrieval_result)

2025-06-21 14:56:05,731 - INFO - Processing TSLA...
2025-06-21 14:56:05,861 - INFO - Filtered by regular hours!
2025-06-21 14:56:06,007 - INFO - Missing values are handled!
2025-06-21 14:56:06,011 - INFO - Total ohlvc rows: 39882. Rows with nulls: 0
2025-06-21 14:56:07,464 - INFO - Features calculated!
2025-06-21 14:56:07,521 - INFO - Features normalized!
2025-06-21 14:56:07,552 - INFO - Target calculated!


In [14]:
# Preview only the first rows of the processed TSLA frame; the full frame is
# tens of thousands of rows and should not be dumped as cell output.
features['TSLA'].head(10)

Unnamed: 0,date,open,high,low,close,volume,return,OBV,RSI6,RSI12,...,ATR_28,FRL_0,FRL_1,FRL_2,FRL_3,FRL_4,RSI_28,Oscillator_K,Oscillator_D,target
0,2025-01-02 13:30:00+00:00,0.864016,0.862829,0.863156,0.863593,0.00133,,0.347404,,,...,0.099815,,,,,,,,,1.0
1,2025-01-02 13:31:00+00:00,0.863703,0.863648,0.865185,0.863593,0.00078,0.528465,0.347404,,,...,0.095548,,,,,,,,,2.0
2,2025-01-02 13:32:00+00:00,0.864596,0.863724,0.864252,0.864754,0.001198,0.533221,0.34751,1.0,1.0,...,0.095114,,,,,,1.0,,,0.0
3,2025-01-02 13:33:00+00:00,0.864819,0.863634,0.864475,0.8627,0.00077,0.520055,0.347442,0.361111,0.361111,...,0.093774,,,,,,0.314424,,,1.0
4,2025-01-02 13:34:00+00:00,0.863257,0.862516,0.864519,0.863369,0.000635,0.53121,0.347498,0.471264,0.471264,...,0.088472,,,,,,0.432627,,,0.0
5,2025-01-02 13:35:00+00:00,0.863525,0.862516,0.861364,0.860737,0.002294,0.517678,0.347296,0.280899,0.280899,...,0.094452,,,,,,0.228351,,,1.0
6,2025-01-02 13:36:00+00:00,0.861026,0.860235,0.861127,0.859886,0.001011,0.524976,0.347207,0.248485,0.248485,...,0.092899,,,,,,0.193568,,,2.0
7,2025-01-02 13:37:00+00:00,0.860178,0.861017,0.861853,0.861485,0.000766,0.535029,0.347274,0.382501,0.382501,...,0.092253,,,,,,0.337377,,,1.0
8,2025-01-02 13:38:00+00:00,0.862364,0.861219,0.863186,0.862298,0.001134,0.531796,0.347374,0.357513,0.43379,...,0.087056,,,,,,0.392414,,,1.0
9,2025-01-02 13:39:00+00:00,0.862409,0.861219,0.863186,0.862208,0.000793,0.528099,0.347304,0.463087,0.429864,...,0.082217,0.863712,0.863191,0.862768,0.862343,0.861814,0.388202,,,0.0


In [10]:
# Write the processed AAPL frame to 'aapl.csv' in the working directory.
# NOTE(review): this needs an 'AAPL' entry in `features`, but the retrieval
# cell visible in this notebook requests only 'TSLA' and this cell's execution
# count predates it -- likely a KeyError on Restart & Run All; confirm.
aapl = features['AAPL']
aapl.to_csv(path_or_buf='aapl.csv')

In [11]:
# Write the processed MSFT frame to 'msft.csv' in the working directory.
# NOTE(review): this needs an 'MSFT' entry in `features`, but the retrieval
# cell visible in this notebook requests only 'TSLA' and this cell's execution
# count predates it -- likely a KeyError on Restart & Run All; confirm.
msft = features['MSFT']
msft.to_csv(path_or_buf='msft.csv')

In [None]:
# Fetch bars for a fixed window (2025-06-06 to 2025-06-10) instead of the
# date range from the experiment config.
# NOTE(review): the original cell passed the undefined name `con` as the
# symbol (a NameError at run time, probably a truncated `config...`
# attribute). 'TSLA' mirrors the other retrieval call in this notebook --
# confirm the intended symbol(s).
# NOTE(review): this rebinds `retriever` and `retrieval_result`, and the
# datetimes are timezone-naive; confirm both are intended.
retriever = AlpacaMarketsRetriever()

retrieval_result = retriever.bars(
    symbol_or_symbols='TSLA',
    start=datetime(2025, 6, 6),
    end=datetime(2025, 6, 10),
)