In [None]:
# Imports
import pandas as pd
from stable_baselines3 import PPO
from stable_baselines3.common.vec_env import DummyVecEnv

from src.agents.evaluate import evaluate_agent
from src.rl_env.trading_env import TradingEnv
from src.visualizations.plot_trades import plot_trades


In [None]:
# Load the AAPL price history from CSV; the 'Date' column is parsed into datetimes.
data = pd.read_csv(
    "data/AAPL.csv",
    parse_dates=["Date"],
)

In [None]:
# Create environment
def _make_trading_env():
    """Build one TradingEnv over the loaded `data` frame for the AAPL ticker."""
    return TradingEnv(data, ticker="AAPL")


# DummyVecEnv takes a list of zero-argument factories; a single one is supplied here.
env = DummyVecEnv([_make_trading_env])

In [None]:
# Train PPO - basic config (default MlpPolicy hyperparameters, no tuning performed here)
total_timesteps = 10000
# Fixed seed so a fresh-kernel re-run trains a comparable model.
# NOTE(review): exact determinism may still depend on device/backend - confirm if required.
seed = 42
model = PPO("MlpPolicy", env, verbose=1, seed=seed)
model.learn(total_timesteps=total_timesteps)
# Persist the trained policy; the evaluation cell reads it back from "models/ppo_AAPL.zip".
model.save("models/ppo_AAPL")

In [None]:
# Evaluate the saved agent and show the last rows of the resulting summary.
# NOTE(review): `data` is the same frame the training environment was built from,
# so this looks like an in-sample evaluation - confirm whether a hold-out split is intended.
summary_df = evaluate_agent(
    "models/ppo_AAPL.zip",
    data,
    "AAPL",
)
latest_rows = summary_df.tail()
display(latest_rows)


In [None]:
# Plot trades
# `plot_trades` is imported in the notebook's import cell so that a missing
# dependency surfaces before training starts rather than in the final cell.
plot_trades(summary_df, title="RL Agent Trades - AAPL")
