In [1]:
# Example 1: Chi-Squared Test on a Real-World Dataset

# Load Titanic dataset and perform Chi-Squared Test on 'Survived' vs 'Pclass'
import pandas as pd
import numpy as np
from scipy.stats import chi2_contingency

# Fetch the Titanic passenger table (CSV hosted on GitHub).
url = 'https://raw.githubusercontent.com/datasciencedojo/datasets/master/titanic.csv'
df = pd.read_csv(url)

# Observed counts: one row per 'Survived' value, one column per 'Pclass' value.
contingency_table = pd.crosstab(index=df['Survived'], columns=df['Pclass'])
print("Contingency Table:\n", contingency_table)

# Chi-squared test of independence on the observed counts. The call yields the
# test statistic, its p-value, the degrees of freedom, and the counts expected
# if the two variables were independent.
chi2, p, dof, expected = chi2_contingency(contingency_table)
print(
    f"\nChi-squared Value: {chi2}",
    f"P-value: {p}",
    f"Degrees of Freedom: {dof}",
    sep="\n",
)
print("Expected Frequencies:\n", expected)

# Decision at the 5% significance level.
reject_null = p < 0.05
print(
    "\nConclusion: Reject Null Hypothesis - Survival is related to Passenger Class."
    if reject_null
    else "\nConclusion: Fail to Reject Null Hypothesis - Survival is independent of Passenger Class."
)



Contingency Table:
 Pclass      1   2    3
Survived              
0          80  97  372
1         136  87  119

Chi-squared Value: 102.88898875696056
P-value: 4.549251711298793e-23
Degrees of Freedom: 2
Expected Frequencies:
 [[133.09090909 113.37373737 302.53535354]
 [ 82.90909091  70.62626263 188.46464646]]

Conclusion: Reject Null Hypothesis - Survival is related to Passenger Class.


In [2]:

# Example 2: Confidence Intervals on a Real-World Dataset

import numpy as np
import pandas as pd
from scipy import stats

# Load dataset
url = 'https://raw.githubusercontent.com/jbrownlee/Datasets/master/housing.data'
column_names = ['CRIM', 'ZN', 'INDUS', 'CHAS', 'NOX', 'RM', 'AGE', 'DIS', 'RAD', 'TAX', 'PTRATIO', 'B', 'LSTAT', 'MEDV']
# The file is whitespace-delimited and column names are supplied explicitly.
# sep=r'\s+' is the documented replacement for delim_whitespace=True, which is
# deprecated and emits a warning on recent pandas versions.
df = pd.read_csv(url, sep=r'\s+', names=column_names)

# Calculate Confidence Interval for mean of 'MEDV'
data = df['MEDV']
mean = np.mean(data)
std = np.std(data, ddof=1)  # ddof=1 -> sample (n - 1) standard deviation
n = len(data)

confidence = 0.95
# Two-sided critical value from the standard normal distribution: for a
# confidence level c it is the (1 + c) / 2 quantile.
# NOTE(review): this is the normal (z) approximation; a t-based interval would
# be slightly wider for small samples.
z_score = stats.norm.ppf((1 + confidence) / 2)
# Margin of error = critical value * standard error of the mean.
margin_error = z_score * (std / np.sqrt(n))
ci_lower = mean - margin_error
ci_upper = mean + margin_error

print(f"Mean House Price: {mean:.2f}")
# Derive the label from `confidence` so the text cannot drift from the level
# actually used above (prints "95%" for confidence = 0.95).
print(f"{confidence:.0%} Confidence Interval: ({ci_lower:.2f}, {ci_upper:.2f})")



  df = pd.read_csv(url, delim_whitespace=True, names=column_names)


Mean House Price: 22.53
95% Confidence Interval: (21.73, 23.33)


In [8]:

# Example 3: Error Metrics with Streamlit Interactive Dashboard

# Save this as app.py and run using: streamlit run app.py
!pip install streamlit
import streamlit as st
import pandas as pd
import numpy as np
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score
import matplotlib.pyplot as plt

st.title("Regression Error Metrics Calculator")

# Load Dataset
url = 'https://raw.githubusercontent.com/jbrownlee/Datasets/master/housing.data'
columns = ['CRIM', 'ZN', 'INDUS', 'CHAS', 'NOX', 'RM', 'AGE', 'DIS', 'RAD', 'TAX', 'PTRATIO', 'B', 'LSTAT', 'MEDV']
df = pd.read_csv(url, delim_whitespace=True, names=columns)

# Feature Selection
features = st.multiselect("Select features:", options=columns[:-1], default=['RM', 'LSTAT'])

if features:
    X = df[features]
    y = df['MEDV']

    # Model Training
    model = LinearRegression()
    model.fit(X, y)
    y_pred = model.predict(X)

    # Error Metrics
    mae = mean_absolute_error(y, y_pred)
    mse = mean_squared_error(y, y_pred)
    rmse = np.sqrt(mse)
    r2 = r2_score(y, y_pred)

    st.write(f"**MAE**: {mae:.2f}")
    st.write(f"**MSE**: {mse:.2f}")
    st.write(f"**RMSE**: {rmse:.2f}")
    st.write(f"**R² Score**: {r2:.2f}")

    # Plot Actual vs Predicted
    fig, ax = plt.subplots()
    ax.scatter(y, y_pred, color='blue')
    ax.plot([y.min(), y.max()], [y.min(), y.max()], 'k--', lw=2)
    ax.set_xlabel('Actual')
    ax.set_ylabel('Predicted')
    ax.set_title('Actual vs Predicted')
    st.pyplot(fig)





  df = pd.read_csv(url, delim_whitespace=True, names=columns)


In [11]:
import requests

# Look up the public IP address of the machine running this notebook.
# NOTE(review): presumably this is the value localtunnel asks for as the tunnel
# password when the app URL is first opened - confirm.
try:
    # Without a timeout, requests can block indefinitely if the service is
    # unreachable, which would hang the cell.
    response = requests.get('https://api.ipify.org', timeout=10)
    # Treat HTTP error statuses as failures rather than printing the body of an
    # error response as if it were an IP address. HTTPError is a subclass of
    # RequestException, so it is handled by the except clause below.
    response.raise_for_status()
    ip = response.text
    print(f"Your public IP address is: {ip}")
except requests.RequestException:
    print("Could not retrieve public IP address.")

Your public IP address is: 34.125.14.13


In [None]:
#!npm install -g localtunnel
!streamlit run app.py &>/dev/null& lt --port 8501
#!streamlit run app.py

your url is: https://flat-lands-burn.loca.lt
