In [None]:
import numpy as np
import matplotlib.pyplot as plt

# Sample sin(x) at 100 evenly spaced points from 0 to 10 (both ends included).
x = np.linspace(0, 10, 100)
y = np.sin(x)

# Draw the curve on an explicit 8x6-inch figure/axes pair instead of relying
# on pyplot's implicit "current axes" state.
fig, ax = plt.subplots(figsize=(8, 6))
ax.plot(x, y, label='sin(x)')
ax.set(title='Sine Function', xlabel='x', ylabel='sin(x)')
ax.legend()
ax.grid(True)
plt.show()


In [None]:
# Jupyter Notebook Project: Data Analysis and Machine Learning

## 1. Data Loading and Preprocessing

import pandas as pd

# Load the dataset and preprocess it in one chain:
#   1. read 'data.csv' from the current working directory,
#   2. replace every missing value with 0,
#   3. one-hot encode the 'category' column.
# NOTE(review): fillna(0) is applied to all columns, so missing entries in
# 'category' become the value 0 before encoding -- confirm that is intended.
df = (
    pd.read_csv('data.csv')
    .fillna(0)
    .pipe(pd.get_dummies, columns=['category'])
)

## 2. Exploratory Data Analysis (EDA)

import matplotlib.pyplot as plt
import seaborn as sns

# Visualize data distributions: 20-bin histogram of df['column'] with a KDE
# curve overlaid. seaborn returns the Axes it drew on, so the title and axis
# labels are set on that object rather than through pyplot's global state.
ax = sns.histplot(df['column'], bins=20, kde=True)
ax.set(title='Distribution of Column X', xlabel='Values', ylabel='Frequency')
plt.show()

# Explore correlations.
# numeric_only=True keeps only numeric columns in the matrix. Since pandas 2.0
# the default is False, and corr() raises on any non-numeric column instead of
# silently dropping it. (The keyword requires pandas >= 1.5.)
correlation_matrix = df.corr(numeric_only=True)
ax = sns.heatmap(correlation_matrix, annot=True, cmap='coolwarm')
ax.set_title('Correlation Matrix')
plt.show()

## 3. Machine Learning Model

from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report

# Separate the label ('target_column') from the feature columns, then hold out
# 20% of the rows for evaluation. random_state=42 makes the split repeatable.
y = df['target_column']
X = df.drop(columns=['target_column'])
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Construct and train the random forest in one expression; fit() returns the
# estimator itself, so `model` is the fitted classifier.
model = RandomForestClassifier(random_state=42).fit(X_train, y_train)

# Score the model on the held-out rows: overall accuracy first, then the
# per-class classification report.
y_pred = model.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print(f'Accuracy: {accuracy:.2f}')
print(classification_report(y_test, y_pred))

# Serialize the fitted model to 'model.pkl' in the current working directory.
import joblib
joblib.dump(model, 'model.pkl')
