# TSA Chapter 8: Model Comparison

[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/QuantLet/TSA/blob/main/TSA_ch8/TSA_ch8_model_comparison/TSA_ch8_model_comparison.ipynb)

Comparison of ARIMA, ARFIMA, Random Forest, and LSTM: prediction accuracy vs computational cost.

In [None]:
!pip install numpy pandas matplotlib scikit-learn statsmodels -q

In [None]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import warnings
warnings.filterwarnings('ignore')

In [None]:
# Named hex colours used by the charts in this notebook.
COLORS = {
    'blue': '#1A3A6E',
    'red': '#DC3545',
    'green': '#2E7D32',
    'orange': '#E67E22',
    'gray': '#666666',
    'purple': '#8E44AD',
}
# Module-level shortcuts so plotting code can write BLUE instead of COLORS['blue'].
BLUE, RED, GREEN, ORANGE, GRAY, PURPLE = (
    COLORS[shade] for shade in ('blue', 'red', 'green', 'orange', 'gray', 'purple')
)

# Global matplotlib defaults applied to every figure created after this point.
plt.rcParams.update({
    # Transparent figure, axes and saved-file backgrounds.
    'figure.facecolor': 'none',
    'axes.facecolor': 'none',
    'savefig.facecolor': 'none',
    'savefig.transparent': True,
    # No top/right spines and no grid.
    'axes.spines.top': False,
    'axes.spines.right': False,
    'axes.grid': False,
    # Font sizes.
    'font.size': 10,
    'axes.titlesize': 12,
    'axes.labelsize': 10,
    'xtick.labelsize': 9,
    'ytick.labelsize': 9,
    'legend.fontsize': 9,
    # Resolution and stroke widths.
    'figure.dpi': 150,
    'lines.linewidth': 1.2,
    'axes.linewidth': 0.6,
    # Frameless, transparent legend.
    'legend.facecolor': 'none',
    'legend.framealpha': 0,
    'legend.edgecolor': 'none',
})
def save_chart(fig, name):
    """Save *fig* as ``<name>.pdf`` and ``<name>.png``, then print the base name.

    Both files are written with a tight bounding box, a transparent
    background and 150 dpi. ``fig`` only needs to provide ``savefig``.
    """
    export_options = {'bbox_inches': 'tight', 'transparent': True, 'dpi': 150}
    # PDF first, then PNG, each with the same export options.
    for extension in ('pdf', 'png'):
        fig.savefig(f'{name}.{extension}', **export_options)
    print(f'Saved: {name}')

In [None]:
# Model comparison: Accuracy vs Computational Cost
# Draws two side-by-side bar charts (RMSE on the left, relative training time
# on a log axis on the right) and saves them via save_chart.
# The numbers below are hard-coded literals; nothing is fitted or timed here.
models = ['ARIMA', 'ARFIMA', 'Random\nForest', 'LSTM']
colors_bar = [BLUE, GREEN, ORANGE, RED]

# Typical RMSE values (lower is better)
rmse_values = [45.2, 42.8, 28.5, 31.2]
# Relative training times
training_times = [1.0, 1.5, 8.0, 45.0]

fig, axes = plt.subplots(1, 2, figsize=(14, 5))

# RMSE comparison
bars1 = axes[0].bar(models, rmse_values, color=colors_bar, alpha=0.8,
                    edgecolor='white', linewidth=0.5)
axes[0].set_ylabel('RMSE (lower is better)')
axes[0].set_title('Prediction Accuracy Comparison', fontweight='bold', fontsize=12)
# Leave 30% headroom above the tallest bar so its value label stays inside the axes.
y_max = max(rmse_values) * 1.3
axes[0].set_ylim(0, y_max)
for bar, val in zip(bars1, rmse_values):
    # Centre each label over its bar, slightly above the bar top.
    axes[0].text(bar.get_x() + bar.get_width()/2, val + y_max * 0.02, f'{val:.1f}',
                 ha='center', fontsize=11, fontweight='bold')

# Training time comparison (log scale)
bars2 = axes[1].bar(models, training_times, color=colors_bar, alpha=0.8,
                    edgecolor='white', linewidth=0.5)
axes[1].set_ylabel('Relative Training Time')
axes[1].set_title('Computational Cost Comparison', fontweight='bold', fontsize=12)
axes[1].set_yscale('log')
# Labels are drawn at val * 1.2, so extend the top limit past that point;
# otherwise the label of the tallest bar ends up above the axes area.
# Only `top` is set, so the autoscaled lower limit of the log axis is kept.
axes[1].set_ylim(top=max(training_times) * 2)
for bar, val in zip(bars2, training_times):
    # 'g' keeps fractional multiples intact (1.5 -> '1.5x'); '.0f' rounded
    # that value to '2x' and misreported it on the chart.
    axes[1].text(bar.get_x() + bar.get_width()/2, val * 1.2, f'{val:g}x',
                 ha='center', fontsize=11, fontweight='bold')

plt.tight_layout()
save_chart(fig, 'ch8_model_comparison')
plt.show()