Load the dataset from a CSV file.

In [None]:
import pandas as pd

# Read the CSV into the `dataset` DataFrame that every later cell works on.
# NOTE(review): 'path/to/dataset.csv' looks like a placeholder -- point it at
# the real file before running.
dataset = pd.read_csv('path/to/dataset.csv')

Display the first few rows of the dataset.

In [None]:
# Show the leading rows for a quick visual check; 5 is head()'s default count,
# written out here so the number of rows is obvious.
print(dataset.head(n=5))

Retrieve the names of the columns.

In [None]:
# Copy the column labels out of the DataFrame into a plain Python list.
column_names = dataset.columns.tolist()

Rename columns as needed.

In [None]:
# Mapping of current column label -> replacement label; edit to suit the data.
column_renames = {'old_name': 'new_name'}
# Applied in place, so `dataset` itself is modified and nothing is reassigned.
dataset.rename(columns=column_renames, inplace=True)

Get the shape (rows, columns) of the dataset.

In [None]:
# (rows, columns) tuple; stored only, nothing is displayed by this cell.
shape = dataset.shape

Check dataset information such as column data types.

In [None]:
# Called for its printed report (data types etc.); the return value is unused.
dataset.info()

Get statistical summary of numerical columns.

In [None]:
# Keep the descriptive-statistics table in `summary`; it is not displayed
# unless `summary` is printed or echoed afterwards.
summary = dataset.describe()

Check for missing values in the dataset.

In [None]:
# Per-column count of missing entries: flag each missing cell, then sum the
# flags down every column. isna() is the same check as isnull().
missing_values = dataset.isna().sum()

Create pairwise scatter plots (a pair plot) of the columns for exploratory data analysis.

In [None]:
import matplotlib.pyplot as plt
import seaborn as sns
# Draw the pairwise-relationship grid for the columns of `dataset`.
sns.pairplot(dataset)
# Render the figure explicitly, matching the other plotting cells; without
# this the plot is never shown when the code runs outside a notebook.
plt.show()

Plot a histogram for a specific column.

In [None]:
# Pull the column out first so the plotting call reads on its own.
# 'column_name' must be replaced with a real column label.
column_values = dataset['column_name']
plt.hist(column_values)
plt.show()

Generate a correlation heatmap.

In [None]:
# Correlate only numeric (and boolean) columns. On pandas >= 2.0 a bare
# DataFrame.corr() raises on string/object columns because numeric_only now
# defaults to False; selecting the dtypes up front works on old and new pandas.
numeric_columns = dataset.select_dtypes(include=['number', 'bool'])
correlation = numeric_columns.corr()
# annot=True writes each coefficient into its cell of the heatmap.
sns.heatmap(correlation, annot=True, cmap='coolwarm')
plt.show()

Split the dataset into features and target.

In [None]:
# Features: every column except the target. Target: that one column alone.
# 'target_column' must be replaced with the real label of the column to predict.
X = dataset.drop(columns='target_column')
y = dataset['target_column']

Perform a train-test split.

In [None]:
from sklearn.model_selection import train_test_split
# Hold out 20% of the rows for testing; the fixed random_state makes the
# split repeatable from run to run.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

Train the model using training data.

In [None]:
from sklearn.linear_model import LinearRegression
# Linear regression estimator created with its default settings.
model = LinearRegression()
# Fit on the training split only; X_test / y_test are not used here.
model.fit(X_train, y_train)

Print the model coefficients.

In [None]:
# coef_ holds the fitted per-feature weights; the intercept lives separately
# in model.intercept_ and is not printed by this cell.
print(model.coef_)

Fit an OLS model with statsmodels on the training data and print its summary.

In [None]:
import statsmodels.api as sm
# statsmodels' OLS does not add an intercept term by itself, so a constant
# column is appended to the training features explicitly.
X_train_sm = sm.add_constant(X_train)
# Separate statsmodels fit on the same training data; it is independent of
# the scikit-learn `model` object trained earlier.
model_sm = sm.OLS(y_train, X_train_sm).fit()
print(model_sm.summary())

Evaluate the model on test data.

In [None]:
# scikit-learn's LinearRegression has no evaluate() method (calling it raises
# AttributeError); score() returns the coefficient of determination (R^2)
# of the predictions on the supplied data.
test_r2 = model.score(X_test, y_test)
print(f"Test R^2: {test_r2:.4f}")

Use the trained model to make predictions on the test data.

In [None]:
# Predicted target values for the held-out test rows, from the already
# fitted `model` (no refitting happens in this cell).
predictions = model.predict(X_test)

Generate predictions for new data.

In [None]:
# NOTE(review): `new_data` is not defined anywhere in the visible source; it
# must be created first -- presumably with the same feature columns the model
# was fitted on (those of X_train). Confirm before running.
new_data_predictions = model.predict(new_data)