In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score
from sklearn.preprocessing import OneHotEncoder


# Load the happiness dataset from a CSV expected in the working directory.
data = pd.read_csv('happiness_score_dataset.csv')

# Quick inspection: the first rows, then the number of missing values
# found in each column.
print(data.head())
print(data.isna().sum())

# Discard every row that contains at least one missing value. The
# surviving rows keep their original index labels, so the index may have
# gaps from this point on.
data = data.dropna()


# One-hot encode the categorical 'Region' column; drop='first' leaves out
# the first category of the feature. `sparse_output` is the name the dense/
# sparse switch has had since scikit-learn 1.2 (the old `sparse` argument
# was removed in 1.4).
ohe = OneHotEncoder(sparse_output=False, drop='first')
encoded_regions = ohe.fit_transform(data[['Region']])

# `get_feature_names` was removed in scikit-learn 1.2; `get_feature_names_out`
# is its replacement. The encoded frame must reuse `data`'s index: after
# dropna() that index can have gaps, and pd.concat(axis=1) aligns on index
# labels, so a fresh 0..n-1 index would misalign rows and reintroduce NaNs.
encoded_df = pd.DataFrame(
    encoded_regions,
    columns=ohe.get_feature_names_out(['Region']),
    index=data.index,
)
data_encoded = pd.concat([data.drop(columns=['Region']), encoded_df], axis=1)


# Separate the regression target from the predictors.
# NOTE(review): every remaining column is handed to the model as a feature;
# confirm none of them is a non-numeric identifier (e.g. a country name).
y = data_encoded['Happiness Score']
X = data_encoded.drop(columns=['Happiness Score'])

# Hold out 20% of the rows for evaluation; the fixed seed makes the split
# repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Fit a linear regression on the training portion.
model = LinearRegression().fit(X_train, y_train)

# Evaluate on the held-out portion.
y_pred = model.predict(X_test)
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

print('Mean Squared Error:', mse)
print('R-squared:', r2)


# A single hypothetical observation to score with the fitted model.
new_features = pd.DataFrame({
    'GDP per Capita': [1.2],
    'Family': [1.5],
    'Life Expectancy': [0.9],
    'Freedom': [0.8],
    'Generosity': [0.7],
    'Trust Government Corruption': [0.3],
    'Region': ['Sub-Saharan Africa']
})

# Encode 'Region' with the encoder that was fitted on the training data so
# the dummy columns are the same ones the model was trained on.
# `get_feature_names` was removed in scikit-learn 1.2; `get_feature_names_out`
# is its replacement.
encoded_new_regions = ohe.transform(new_features[['Region']])
encoded_new_df = pd.DataFrame(
    encoded_new_regions,
    columns=ohe.get_feature_names_out(['Region']),
    index=new_features.index,
)
new_features_encoded = pd.concat(
    [new_features.drop(columns=['Region']), encoded_new_df],
    axis=1,
)

# scikit-learn expects the same feature names, in the same order, as were
# seen during fit. Selecting by the training columns enforces that order and
# raises a KeyError naming any training feature missing from the sample.
new_features_encoded = new_features_encoded[X.columns]

predicted_score = model.predict(new_features_encoded)
print('Predicted Happiness Score:', predicted_score)


In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score


# Fetch the Titanic training set. pd.read_csv needs the raw file contents:
# a github.com/<user>/<repo>/blob/... address serves the HTML viewer page,
# which cannot be parsed as CSV, so the raw.githubusercontent.com address
# of the same file is used instead.
url = "https://raw.githubusercontent.com/dsrscientist/dataset1/master/titanic_train.csv"
data = pd.read_csv(url)


# Drop the columns that are not used as model features.
data = data.drop(columns=['PassengerId', 'Name', 'Ticket', 'Cabin'])

# Replace the categorical text values with integer codes. Values that are
# absent from a mapping (including missing values) become NaN.
data['Sex'] = data['Sex'].map({'female': 0, 'male': 1})
data['Embarked'] = data['Embarked'].map({'S': 0, 'C': 1, 'Q': 2})

# Impute missing values: median for 'Age', most frequent code for 'Embarked'.
# The result is assigned back to the column instead of calling
# fillna(inplace=True) on `data[col]`: that form is chained assignment,
# which warns on pandas 2.x and leaves `data` unchanged under Copy-on-Write.
data['Age'] = data['Age'].fillna(data['Age'].median())
data['Embarked'] = data['Embarked'].fillna(data['Embarked'].mode()[0])


# Separate the 'Survived' label from the predictors.
y = data['Survived']
X = data.drop(columns='Survived')

# Hold out 20% of the passengers for evaluation; the fixed seed makes the
# split repeatable.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,
)

# Fit a random forest with a fixed seed so repeated runs give the same model.
model = RandomForestClassifier(random_state=42).fit(X_train, y_train)

# Predict on the held-out passengers and report the share classified correctly.
y_pred = model.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)
