In [None]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn import metrics

In [None]:
# Read the weather observations (point this at the real CSV location).
dataset = pd.read_csv("weather.csv")

# Scatter MaxTemp against MinTemp using point markers. DataFrame.plot hands
# back the Axes it drew on, so the title and both axis labels are set on it
# in a single call before the figure is shown.
dataset.plot(x='MinTemp', y='MaxTemp', style='o').set(
    title='MinTemp vs MaxTemp',
    xlabel='MinTemp',
    ylabel='MaxTemp',
)
plt.show()

In [None]:
# Feature (MinTemp) and target (MaxTemp), each reshaped into an (n, 1) column
# array.
x, y = (dataset[column].values.reshape(-1, 1) for column in ('MinTemp', 'MaxTemp'))

# Hold out 20% of the rows for testing; the fixed seed keeps the split
# repeatable across runs.
x_train, x_test, y_train, y_test = train_test_split(
    x,
    y,
    test_size=0.2,
    random_state=0,
)

In [None]:
# Fit a linear regression on the training split produced by the previous cell
# (x_train holds MinTemp, y_train holds MaxTemp).
regressor = LinearRegression()
regressor.fit(x_train, y_train)

# Report the parameters of the fitted line.
print("Intercept: ", regressor.intercept_)
print("Slope: ", regressor.coef_)

# Predict MaxTemp for the held-out rows.
y_pred = regressor.predict(x_test)

# Side-by-side comparison of actual vs predicted values. Both arrays are
# flattened to 1-D so each becomes one DataFrame column.
df = pd.DataFrame({'Actual': y_test.flatten(), 'Predicted': y_pred.flatten()})
print(df)

# Overlay the fitted line on the test points. The figure is titled and
# labelled like the exploratory scatter earlier in the notebook so it can be
# read on its own.
plt.scatter(x_test, y_test, color = 'gray', label = 'Actual')
plt.plot(x_test, y_pred, color = 'red', linewidth = 2, label = 'Predicted')
plt.title('MinTemp vs MaxTemp (test set)')
plt.xlabel('MinTemp')
plt.ylabel('MaxTemp')
plt.legend()
plt.show()

In [None]:
from sklearn.datasets import make_blobs
from sklearn.svm import SVC

# Draw 500 synthetic points around two centers (cluster std 0.4, fixed seed).
X, Y = make_blobs(n_samples=500, centers=2, random_state=0, cluster_std=0.4)

# Show the points, colored by their blob label. X.T unpacks into the two
# feature columns (first feature on the x-axis, second on the y-axis).
plt.scatter(*X.T, c=Y, s=50, cmap='spring')
plt.show()

# Fit a linear-kernel SVM on the whole synthetic set (fit returns the
# estimator itself, so construction and training are chained).
clf = SVC(kernel='linear').fit(X, Y)

# Classify two hand-picked points.
print("Prediction for [1.5, 2.5]: ", clf.predict([[1.5, 2.5]]))
print("Prediction for [3, 1]: ", clf.predict([[3, 1]]))

In [None]:
from sklearn.preprocessing import StandardScaler 
from sklearn.metrics import classification_report, accuracy_score 

# Read the cancer table (point this at the real CSV location) and discard the
# 'State' column, which the notebook treats as non-numeric.
df = pd.read_csv("cancer.csv").drop(columns=['State'])

# Binary target from a median split on 'Total.Rate':
# 1 when a row's rate is strictly above the median, 0 otherwise.
median_rate = df['Total.Rate'].median()
df['Cancer_Class'] = df['Total.Rate'].gt(median_rate).astype(int)

# Features: every remaining column except the label and the rate the label
# was derived from.
X = df.drop(columns=['Total.Rate', 'Cancer_Class']).values
# Labels: 0 = low cancer rate, 1 = high cancer rate.
Y = df['Cancer_Class'].values

In [None]:
# Split the cancer features/labels into training (80%) and testing (20%).
# This must use the upper-case X, Y built from the cancer data; the lower-case
# x, y still hold the weather regression arrays, whose continuous values are
# not valid class labels for SVC.
x_train, x_test, y_train, y_test = train_test_split(X, Y, test_size=0.2, random_state=42)

# Standardize the features. The scaler is fitted on the training split only
# and then applied to the test split, so no test-set statistics leak into
# training.
# NOTE(review): assumes every column left in X is numeric - confirm against
# the CSV schema.
scaler = StandardScaler()
x_train = scaler.fit_transform(x_train)
x_test = scaler.transform(x_test)

# Train a linear-kernel SVM classifier on the standardized training data.
clf = SVC(kernel='linear')
clf.fit(x_train, y_train)

# Predict the class of each held-out row.
y_pred = clf.predict(x_test)

# Print overall accuracy followed by the per-class report.
print("Accuracy:", accuracy_score(y_test, y_pred))
print("\nClassification Report:\n", classification_report(y_test, y_pred))