# 🎬 Movie Theater Attendance vs Economic Conditions in Turkey

In this project, we analyze how macroeconomic indicators such as GDP and inflation relate to movie theater attendance in Turkey.
We test whether economic prosperity is associated with higher cinema attendance and whether economic hardship coincides with a decline.


In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.linear_model import LinearRegression
from sklearn.preprocessing import StandardScaler
from sklearn.metrics import mean_squared_error, r2_score
from scipy.stats import pearsonr

# Read the project dataset from CSV into `df`. The cells that follow use its
# Year, TotalAudience, InflationRate and GDP columns.
df = pd.read_csv(filepath_or_buffer="final_cinema_economic_data.csv")


In [None]:
# Line chart of yearly total audience, drawn through the Axes interface.
fig, ax = plt.subplots(figsize=(10, 6))
ax.plot(df["Year"], df["TotalAudience"], marker="o")
ax.set_title("Total Movie Audience Over Time")
ax.set_xlabel("Year")
ax.set_ylabel("Audience Count")
ax.grid()
plt.show()


In [None]:
# Inflation Rate Over Time
# InflationRate may be stored as text with a decimal comma (e.g. "12,5").
# Plotting such strings would give a categorical y-axis, so convert to numbers
# first. The conversion is local: `df` itself is not modified here, and values
# that still cannot be parsed become NaN and are simply not drawn.
inflation_numeric = pd.to_numeric(
    df["InflationRate"].astype(str).str.replace(",", ".", regex=False),
    errors="coerce",
)

plt.figure(figsize=(10,6))
plt.plot(df["Year"], inflation_numeric, marker='s', color="orange")
plt.title("Inflation Rate Over Time")
plt.xlabel("Year")
plt.ylabel("Inflation Rate (%)")
plt.grid()
plt.show()


In [None]:
# Line chart of GDP per year (green, triangle markers).
gdp_fig, gdp_ax = plt.subplots(figsize=(10, 6))
gdp_ax.plot(df["Year"], df["GDP"], marker="^", color="green")
gdp_ax.set(
    title="Turkey GDP Over Time",
    xlabel="Year",
    ylabel="GDP (Current US$)",
)
gdp_ax.grid()
plt.show()


In [None]:
# Scatter of total audience against GDP; seaborn returns the Axes it drew on,
# which is then labelled directly.
scatter_ax = sns.scatterplot(data=df, x="GDP", y="TotalAudience")
scatter_ax.set_title("GDP vs Total Movie Audience")
scatter_ax.set_xlabel("GDP (Current US$)")
scatter_ax.set_ylabel("Audience Count")
scatter_ax.grid()
plt.show()


In [None]:
# Inflation vs Audience
# InflationRate may be stored as text with a decimal comma (e.g. "12,5").
# Convert it to numbers on a temporary copy so the x-axis is numeric rather
# than categorical; `df` itself is left unchanged by this cell.
inflation_plot_df = df.assign(
    InflationRate=pd.to_numeric(
        df["InflationRate"].astype(str).str.replace(",", ".", regex=False),
        errors="coerce",
    )
)

sns.scatterplot(x="InflationRate", y="TotalAudience", data=inflation_plot_df)
plt.title("Inflation Rate vs Audience")
plt.xlabel("Inflation Rate (%)")
plt.ylabel("Audience Count")
plt.grid()
plt.show()


In [None]:
# Clean inflation format: turn decimal commas into decimal points, then parse
# to numbers. Values that still cannot be parsed become NaN (errors="coerce").
df["InflationRate"] = df["InflationRate"].astype(str).str.replace(",", ".", regex=False)
df["InflationRate"] = pd.to_numeric(df["InflationRate"], errors="coerce")

# Correlation Test
# Drop incomplete rows *pairwise*. Dropping NaNs from each column separately
# would either make the two series different lengths (pearsonr raises) or
# silently pair a GDP value with the audience of a different year.
paired = df[["GDP", "TotalAudience"]].dropna()
corr, p_val = pearsonr(paired["GDP"], paired["TotalAudience"])
print(f"GDP-Audience Correlation: {corr:.3f}")
print(f"P-value: {p_val:.4f}")


In [None]:
# Fit a linear regression of TotalAudience on standardized GDP and
# InflationRate, then report in-sample RMSE and R^2.

# Keep only rows where both predictors AND the target are present, so the
# feature matrix and target stay aligned and the fit never sees NaN.
model_data = df[["GDP", "InflationRate", "TotalAudience"]].dropna()
features = model_data[["GDP", "InflationRate"]]
target = model_data["TotalAudience"]

# Standardize the predictors (zero mean, unit variance per column).
scaler = StandardScaler()
X_scaled = scaler.fit_transform(features)

model = LinearRegression()
model.fit(X_scaled, target)
# Predictions are made on the training data itself, so the metrics below
# are in-sample.
predictions = model.predict(X_scaled)

# RMSE is the square root of the MSE. The `squared=False` shortcut was
# deprecated in scikit-learn 1.4 and removed in 1.6, so take the root here.
rmse = mean_squared_error(target, predictions) ** 0.5
r2 = r2_score(target, predictions)

print(f"RMSE: {rmse:.2f}")
print(f"R^2 Score: {r2:.3f}")


In [None]:
# Actual vs predicted attendance for the rows used in the regression.
# `features.index` holds index *labels*, so select the matching years with
# label-based `.loc`. Position-based `.iloc` only gives the same rows when
# df has a default 0..n-1 index.
model_years = df.loc[features.index, "Year"]

plt.plot(model_years, target, label="Actual")
plt.plot(model_years, predictions, label="Predicted", linestyle="--")
plt.title("Actual vs Predicted Movie Attendance")
plt.xlabel("Year")
plt.ylabel("Audience Count")
plt.legend()
plt.grid()
plt.show()


### 📌 Conclusion

- The **GDP-Audience correlation was 0.626** with a **p-value of 0.0011**, indicating a significant positive relationship.
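- The **linear regression model yielded an in-sample R² score of 0.392** (it was evaluated on the same data it was fitted on), meaning GDP and inflation together explain roughly 39% of the variance in attendance — moderate explanatory power.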
- These findings suggest that economic growth is associated with higher movie theater attendance.
- The model may be improved by including more variables such as consumer confidence, exchange rate, or tourism statistics.
