# TSA Chapter 8: GPH Log-Periodogram Estimation

[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/QuantLet/TSA/blob/main/TSA_ch8/TSA_ch8_gph_estimation/TSA_ch8_gph_estimation.ipynb)

Geweke–Porter-Hudak (GPH) log-periodogram regression for estimating the fractional differencing (long-memory) parameter d.

In [None]:
!pip install numpy pandas matplotlib statsmodels scikit-learn scipy -q

In [None]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from scipy import stats
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_squared_error
from statsmodels.tsa.stattools import acf
import warnings
warnings.filterwarnings('ignore')

In [None]:
import os
# Shared colour palette for the chapter's figures (hex RGB strings).
COLORS = {
    'blue': '#1A3A6E',
    'red': '#DC3545',
    'green': '#2E7D32',
    'orange': '#E67E22',
    'gray': '#666666',
    'purple': '#8E44AD',
}
# Module-level shortcuts so plotting code can write BLUE instead of COLORS['blue'].
BLUE, RED, GREEN, ORANGE, GRAY, PURPLE = (
    COLORS[key] for key in ('blue', 'red', 'green', 'orange', 'gray', 'purple')
)

# Global matplotlib defaults, grouped by what they affect.
_RC_STYLE = {
    # Transparent backgrounds, both on screen and in saved files.
    'figure.facecolor': 'none',
    'axes.facecolor': 'none',
    'savefig.facecolor': 'none',
    'savefig.transparent': True,
    # Axes: no top/right spines, no grid.
    'axes.spines.top': False,
    'axes.spines.right': False,
    'axes.grid': False,
    # Font sizes.
    'font.size': 10,
    'axes.titlesize': 12,
    'axes.labelsize': 10,
    'xtick.labelsize': 9,
    'ytick.labelsize': 9,
    'legend.fontsize': 9,
    # Resolution and line weights.
    'figure.dpi': 150,
    'lines.linewidth': 1.2,
    'axes.linewidth': 0.6,
    # Legend drawn without a visible box.
    'legend.facecolor': 'none',
    'legend.framealpha': 0,
    'legend.edgecolor': 'none',
}
plt.rcParams.update(_RC_STYLE)
def save_chart(fig, name):
    """Save *fig* as ``<name>.pdf`` and ``<name>.png`` and print a confirmation.

    Both files are written through ``fig.savefig`` with a tight bounding box,
    a transparent background and 150 dpi. *name* is used as given, without an
    extension; the PDF is written first, then the PNG.
    """
    export_options = {'bbox_inches': 'tight', 'transparent': True, 'dpi': 150}
    for extension in ('pdf', 'png'):
        fig.savefig(f'{name}.{extension}', **export_options)
    print(f'Saved: {name}')

In [None]:
# --- GPH (Geweke & Porter-Hudak) log-periodogram estimate of d -------------
# Simulate Gaussian white noise with a fixed seed for reproducibility.
# White noise has no long memory, so the true value is d = 0.
np.random.seed(42)
n = 1000
x = np.random.normal(0, 1, n)

# Fourier frequencies lambda_j = 2*pi*j/n for j = 1..n//2 and the periodogram
# I(lambda_j) = |DFT_j(x)|^2 / (2*pi*n) at those frequencies (j = 0 is skipped).
freq = np.arange(1, n//2 + 1) * 2*np.pi/n
periodogram = np.abs(np.fft.fft(x)[1:n//2 + 1])**2 / (2*np.pi*n)

# Bandwidth: only the m = floor(sqrt(n)) lowest frequencies enter the regression.
m = int(n**0.5)
log_freq = np.log(4*np.sin(freq[:m]/2)**2)
log_period = np.log(periodogram[:m])

# Not used in this cell; kept in case later cells rely on the name `P`.
from numpy.polynomial import polynomial as P

# GPH regression: log I(lambda_j) = c - d * log(4 sin^2(lambda_j / 2)) + e_j.
# np.polyfit returns [slope, intercept], and with this regressor the slope is
# -d itself. Dividing by 2 is only correct when regressing on log(lambda_j),
# because 4 sin^2(lambda/2) ~ lambda^2 near zero; applying it here would halve
# the estimate.
coef = np.polyfit(log_freq, log_period, 1)
d_hat = -coef[0]

# Scatter of the regression points with the fitted line; the legend reports d_hat.
fig, ax = plt.subplots(figsize=(8, 4))
ax.scatter(log_freq, log_period, color=BLUE, alpha=0.5, s=15)
ax.plot(log_freq, np.polyval(coef, log_freq), color=RED, lw=2, label=f'GPH: d = {d_hat:.3f}')
ax.set_xlabel('log(frequency)')
ax.set_ylabel('log(periodogram)')
ax.set_title('GPH Log-Periodogram Regression', fontweight='bold')
ax.legend(loc='upper center', bbox_to_anchor=(0.5, -0.15), frameon=False)
plt.tight_layout()
# NOTE(review): the output name refers to "arima_vs_arfima_real", not to this
# GPH plot -- possibly a copy-paste leftover; confirm before renaming, since
# other material may reference the existing file name.
save_chart(fig, 'ch8_arima_vs_arfima_real')
plt.show()