In [17]:
import pandas as pd
import numpy as np
from sklearn.linear_model import LinearRegression
import matplotlib.pyplot as plt

def build_linear_model(df, x_var, y_var, dataset_label):
    """
    Builds and plots a linear regression model for the given dataset.
    
    Args:
    df: Pandas DataFrame containing the data
    x_var: The independent variable (e.g., 'budget')
    y_var: The dependent variable (e.g., 'revenue')
    dataset_label: A string label for the dataset (e.g., 'English Movies')
    
    Returns:
    Linear model coefficients and plot
    """
    # Reshape data for sklearn
    X = df[[x_var]]  # Independent variable (budget)
    y = df[y_var]    # Dependent variable (revenue)
    
    # Create and fit the linear regression model
    model = LinearRegression()
    model.fit(X, y)
    
    # Get model parameters
    intercept = model.intercept_
    coefficient = model.coef_[0]
    
    # Print the linear model equation
    print(f'Linear Model for {dataset_label}: Revenue = {intercept:.2f} + {coefficient:.6f} * Budget')
    
    # Predict values using the model
    y_pred = model.predict(X)
    
    # Plotting the data and the regression line
    plt.scatter(X, y, color='blue', label='Actual data')
    plt.plot(X, y_pred, color='red', label='Fitted line')
    plt.title(f'{dataset_label}: Budget vs Revenue')
    plt.xlabel(x_var)
    plt.ylabel(y_var)
    plt.legend()
    plt.grid(True)
    plt.show()

    return model

# Load JSON datasets from the same directory
df_english = pd.read_json('english_movies.json')
df_french = pd.read_json('french_movies.json')

# Build and plot the linear model for English movies
model_english = build_linear_model(df_english, 'budget', 'revenue', 'English Movies')

# Build and plot the linear model for French movies
model_french = build_linear_model(df_french, 'budget', 'revenue', 'French Movies')


FileNotFoundError: File english_movies.json does not exist

In [19]:
import pandas as pd

In [21]:
df = pd.read_json("english_movies.json")

FileNotFoundError: File english_movies.json does not exist