In [3]:
import pandas as pd

# Sample data
data = {
    'Student': ['Alice', 'Bob', 'Charlie', 'David', 'Eve'],
    'Math': [85, 78, None, 92, 88],
    'Science': [90, None, 85, 88, 92],
    'English': [None, 82, 78, 85, 90]
}

# Create DataFrame
df = pd.DataFrame(data)
print("Original DataFrame:")
print(df)
# Forward fill missing values
df_ffill = df.fillna(method='ffill')
print("\nDataFrame after forward fill:")
print(df_ffill)



Original DataFrame:
   Student  Math  Science  English
0    Alice  85.0     90.0      NaN
1      Bob  78.0      NaN     82.0
2  Charlie   NaN     85.0     78.0
3    David  92.0     88.0     85.0
4      Eve  88.0     92.0     90.0

DataFrame after forward fill:
   Student  Math  Science  English
0    Alice  85.0     90.0      NaN
1      Bob  78.0     90.0     82.0
2  Charlie  78.0     85.0     78.0
3    David  92.0     88.0     85.0
4      Eve  88.0     92.0     90.0


  df_ffill = df.fillna(method='ffill')


In [4]:
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error

data = {
    'Previous_Scores': [85, 78, 88, 92, 75],
    'Current_Scores': [88, 80, 90, 95, 78]
}

df = pd.DataFrame(data)

X = df[['Previous_Scores']]
y = df['Current_Scores']

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
model = LinearRegression()
model.fit(X_train, y_train)
y_pred = model.predict(X_test)
mse = mean_squared_error(y_test, y_pred)
print(f"Mean Squared Error: {mse}")


Mean Squared Error: 0.7795325268386474


In [6]:
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score

data = {
    'Credit_History': [1, 0, 1, 1, 0],
    'Income': [50000, 30000, 60000, 70000, 20000],
    'Loan_Status': [1, 0, 1, 1, 0]
}

df = pd.DataFrame(data)

X = df[['Credit_History', 'Income']]
y = df['Loan_Status']

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
model = DecisionTreeClassifier()
model.fit(X_train, y_train)

y_pred = model.predict(X_test)

accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy}")


Accuracy: 1.0


In [7]:
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.naive_bayes import MultinomialNB
from sklearn.metrics import accuracy_score

emails = ['Free money now!!!', 'Meeting at 10am', 'Win a free iPhone', 'Lunch at noon?', 'Get rich quick']
labels = [1, 0, 1, 0, 1]  # 1 for spam, 0 for not 

df = pd.DataFrame({'Email': emails, 'Label': labels})

X = df['Email']
y = df['Label']

vectorizer = CountVectorizer()
X = vectorizer.fit_transform(X)
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

model = MultinomialNB()
model.fit(X_train, y_train)

y_pred = model.predict(X_test)

accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy}")


Accuracy: 1.0


In [8]:
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.metrics import accuracy_score

data = {
    'Symptom1': [1, 0, 1, 1, 0],
    'Symptom2': [0, 1, 1, 0, 1],
    'Disease': [0, 1, 0, 0, 1]  # 0 for Disease A, 1 for Disease B
}

df = pd.DataFrame(data)

X = df[['Symptom1', 'Symptom2']]
y = df['Disease']

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
model = KNeighborsClassifier(n_neighbors=3)
model.fit(X_train, y_train)

y_pred = model.predict(X_test)

accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy}")


Accuracy: 0.0


In [9]:
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error

data = {
    'Size': [1500, 2000, 2500, 1800, 2200],
    'Price': [300000, 400000, 500000, 350000, 450000]
}

df = pd.DataFrame(data)

X = df[['Size']]
y = df['Price']

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
model = LinearRegression()
model.fit(X_train, y_train)

y_pred = model.predict(X_test)

mse = mean_squared_error(y_test, y_pred)
print(f"Mean Squared Error: {mse}")


Mean Squared Error: 0.0


In [12]:
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.metrics import accuracy_score

data = {
    'Symptom1': [1, 0, 1, 1, 0],
    'Symptom2': [0, 1, 1, 0, 1],
    'Disease': [0, 1, 0, 0, 1]  # 0 for Disease A, 1 for Disease B
}

df = pd.DataFrame(data)

X = df[['Symptom1', 'Symptom2']]
y = df['Disease']

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
model = KNeighborsClassifier(n_neighbors=3)
model.fit(X_train, y_train)

y_pred = model.predict(X_test)

# Evaluate the model
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy}")


Accuracy:55.3
