## Loading packages

In [None]:
import pandas as pd
import numpy as np
from sklearn.metrics import mean_squared_error, r2_score

## Loading data

In [None]:
# Workbook on disk and the worksheet that holds the two series
file_path = 'bloomberg.xlsx'
sheet_name = 'AlimentacaoDomicilio'

# Parse the worksheet; its first row supplies the column names
df = pd.read_excel(file_path, sheet_name=sheet_name, header=0)

# Coerce both series to numeric in one pass; any cell that cannot be
# parsed as a number becomes NaN instead of raising
df[['Focus', 'Observado']] = df[['Focus', 'Observado']].apply(
    pd.to_numeric, errors='coerce'
)

# Keep only the rows where both 'Focus' and 'Observado' are present
df_cleaned = df.dropna(subset=['Focus', 'Observado'])

## Accuracy Metrics

In [None]:
# Calculating R^2, with 'Observado' as the true values and 'Focus' as the predictions
r_squared = r2_score(df_cleaned['Observado'], df_cleaned['Focus'])

# Calculating MAPE (excluding rows where 'Observado' is zero).
# The percentage error divides by 'Observado', so a zero observation would
# produce inf (or NaN for 0/0) and contaminate the mean; those rows are
# filtered out first. If every observation is zero the result is NaN.
nonzero_obs = df_cleaned[df_cleaned['Observado'] != 0]
mape = (np.abs((nonzero_obs['Observado'] - nonzero_obs['Focus']) / nonzero_obs['Observado'])).mean() * 100

# Calculating RMSE as the square root of the mean squared error (all rows)
rmse = np.sqrt(mean_squared_error(df_cleaned['Observado'], df_cleaned['Focus']))

# Notebook cell output: show the three metrics together
r_squared, mape, rmse