In [None]:
import pandas as pd

# Read the Excel workbook named by file_path into a DataFrame
file_path = 'Registos_Incendios_SGIF_2011_2020.xlsx'
df = pd.read_excel(io=file_path)

# Preview the leading rows to get a feel for the available columns
print(df.head(n=5))


In [None]:
# Convert relevant columns to datetime
df['DataHoraAlerta'] = pd.to_datetime(df['DataHoraAlerta'])
df['DataHoraIntervencao'] = pd.to_datetime(df['DataHoraIntervencao'])

# Convert 'Duracao_Horas' to float, accepting decimal commas.
# The `.str` accessor only works on string data: it raises AttributeError on
# a numeric column and turns non-string entries of a mixed column into NaN.
# So the comma is replaced only in values that are actually strings, which
# also keeps this cell safe to re-run after the column has become float.
duration_raw = df['Duracao_Horas']
if not pd.api.types.is_numeric_dtype(duration_raw):
    duration_raw = duration_raw.map(
        lambda value: value.replace(',', '.') if isinstance(value, str) else value
    )
# to_numeric still raises on text that is not a number, so bad data is not
# hidden; astype(float) keeps the dtype float even if every value is integral.
df['Duracao_Horas'] = pd.to_numeric(duration_raw).astype(float)

# Calculate response time in minutes (intervention timestamp minus alert timestamp)
df['ResponseTime_Minutes'] = (df['DataHoraIntervencao'] - df['DataHoraAlerta']).dt.total_seconds() / 60

# Display the first few rows to verify the changes
print(df[['DataHoraAlerta', 'DataHoraIntervencao', 'Duracao_Horas', 'ResponseTime_Minutes']].head())


In [None]:
import matplotlib.pyplot as plt
import seaborn as sns
from scipy.stats import pearsonr

# Scatter plot to visualize the relationship
plt.figure(figsize=(10, 6))
sns.scatterplot(x='ResponseTime_Minutes', y='Duracao_Horas', data=df, alpha=0.6)
plt.xlabel('Response Time (Minutes)')
plt.ylabel('Duration of Fires (Hours)')
plt.title('Response Time vs Duration of Fires')
plt.show()

# Calculate the Pearson correlation coefficient.
# Pearson needs paired observations, so rows are dropped when EITHER value is
# missing. Dropping NaNs from each column separately would either give arrays
# of different lengths (ValueError) or silently pair values from different rows.
paired = df[['ResponseTime_Minutes', 'Duracao_Horas']].dropna()
if len(paired) >= 2:
    correlation, p_value = pearsonr(paired['ResponseTime_Minutes'], paired['Duracao_Horas'])
else:
    # pearsonr requires at least two observations; report NaN instead of crashing
    correlation, p_value = float('nan'), float('nan')
print(f'Pearson Correlation: {correlation:.2f}, P-value: {p_value:.2e}')


In [None]:
# Tag every record with the calendar year of its alert timestamp
df['Year'] = df['DataHoraAlerta'].dt.year

# Per-year mean of fire duration and of response time
yearly_stats = (
    df.groupby('Year')[['Duracao_Horas', 'ResponseTime_Minutes']]
    .mean()
    .reset_index()
)

# Draw both yearly averages as marked lines on one shared set of axes
fig, ax = plt.subplots(figsize=(14, 6))
for column, legend_label in (
    ('Duracao_Horas', 'Average Duration of Fires (Hours)'),
    ('ResponseTime_Minutes', 'Average Response Time (Minutes)'),
):
    sns.lineplot(x='Year', y=column, data=yearly_stats, marker='o', label=legend_label, ax=ax)
ax.set_xlabel('Year')
ax.set_ylabel('Average Value')
ax.set_title('Trends in Fire Duration and Response Times Over the Years')
ax.legend()
plt.show()
