In [None]:
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score

# Hold-out validation: set 20% of the samples aside and score the model on them.
# X (features) and y (labels) are expected to be defined before this cell runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.2,
    random_state=42,  # fixed seed so the same rows land in each partition on every run
)

# Train on the 80% partition only.
model = LogisticRegression()
model.fit(X_train, y_train)

# Compare predictions for the held-out rows against their true labels.
predictions = model.predict(X_test)
accuracy = accuracy_score(y_true=y_test, y_pred=predictions)

print("Holdout Validation Accuracy:", accuracy)


In [None]:
from sklearn.model_selection import KFold
from sklearn.model_selection import cross_val_score
from sklearn.linear_model import LogisticRegression

# K-fold cross-validation: five shuffled folds, seeded so the fold assignment is repeatable.
# X (features) and y (labels) are expected to be defined before this cell runs.
model = LogisticRegression()
kf = KFold(
    n_splits=5,
    shuffle=True,
    random_state=42,
)

# cv_results holds the per-split accuracies; only their mean is reported below.
cv_results = cross_val_score(
    estimator=model,
    X=X,
    y=y,
    scoring='accuracy',
    cv=kf,
)

print("K-Fold Cross-Validation Accuracy:", cv_results.mean())


In [None]:
from sklearn.model_selection import StratifiedKFold
from sklearn.model_selection import cross_val_score
from sklearn.linear_model import LogisticRegression

# Stratified K-fold cross-validation: five shuffled, seeded folds built by StratifiedKFold,
# which uses the labels in y when assigning samples to folds.
# X (features) and y (labels) are expected to be defined before this cell runs.
model = LogisticRegression()
skf = StratifiedKFold(
    n_splits=5,
    shuffle=True,
    random_state=42,
)

# cv_results holds the per-split accuracies; only their mean is reported below.
cv_results = cross_val_score(
    estimator=model,
    X=X,
    y=y,
    scoring='accuracy',
    cv=skf,
)

print("Stratified K-Fold Cross-Validation Accuracy:", cv_results.mean())


In [None]:
from sklearn.model_selection import LeavePOut
from sklearn.model_selection import cross_val_score
from sklearn.linear_model import LogisticRegression

# Leave-P-Out cross-validation with p=2: every split holds out two samples for testing.
# X (features) and y (labels) are expected to be defined before this cell runs.
# NOTE(review): LeavePOut enumerates every possible pair of samples, so the number of
# model fits grows quadratically with the dataset size; keep X small for this cell.
model = LogisticRegression()
lpo = LeavePOut(p=2)

# With two test samples per split, each per-split accuracy can only be 0.0, 0.5 or 1.0;
# the mean over all splits is what gets reported.
cv_results = cross_val_score(
    estimator=model,
    X=X,
    y=y,
    scoring='accuracy',
    cv=lpo,
)

print("Leave-P-Out Cross-Validation Accuracy:", cv_results.mean())


In [None]:
from sklearn.model_selection import TimeSeriesSplit
from sklearn.model_selection import cross_val_score
from sklearn.linear_model import LogisticRegression

# Time-series cross-validation with five splits.
# X (features) and y (labels) are expected to be defined before this cell runs.
# No timestamp array is passed to the splitter or to cross_val_score here, so the rows
# of X and y are assumed to be sorted chronologically already — TODO confirm upstream.
model = LogisticRegression()
tscv = TimeSeriesSplit(n_splits=5)

# cv_results holds the per-split accuracies; only their mean is reported below.
cv_results = cross_val_score(
    estimator=model,
    X=X,
    y=y,
    scoring='accuracy',
    cv=tscv,
)

print("Time Series Cross-Validation Accuracy:", cv_results.mean())


In [None]:
from sklearn.model_selection import RepeatedKFold
from sklearn.model_selection import cross_val_score
from sklearn.linear_model import LogisticRegression

# Repeated K-fold cross-validation: 5 folds repeated 3 times (15 scores), seeded for repeatability.
# X (features) and y (labels) are expected to be defined before this cell runs.
model = LogisticRegression()
rkf = RepeatedKFold(
    n_splits=5,
    n_repeats=3,
    random_state=42,
)

# cv_results holds one accuracy per split across all repeats; only the mean is reported.
cv_results = cross_val_score(
    estimator=model,
    X=X,
    y=y,
    scoring='accuracy',
    cv=rkf,
)

print("Repeated K-Fold Cross-Validation Accuracy:", cv_results.mean())


In [None]:
from sklearn.model_selection import cross_val_score
from sklearn.model_selection import KFold
from sklearn.model_selection import GridSearchCV
from sklearn.ensemble import RandomForestClassifier

# Nested cross-validation: an inner grid search selects hyper-parameters, and an
# outer loop scores the whole tuning procedure.
# Assume X and y are your features and labels

# Use a dedicated splitter for each level so the inner and outer loops are explicit
# and can be tuned independently. The inner splitter keeps the settings the grid
# search used before, so the fold assignment is unchanged.
kf_inner = KFold(n_splits=5, shuffle=True, random_state=42)
kf_outer = KFold(n_splits=5, shuffle=True, random_state=42)

# Seed the forest as well: the splitters are seeded, but an unseeded
# RandomForestClassifier would still make the reported accuracy vary between runs.
model = RandomForestClassifier(random_state=42)

# 3 x 3 = 9 candidate settings, each evaluated on every inner fold of every outer
# training partition, so this cell is considerably slower than the others.
param_grid = {'n_estimators': [10, 50, 100], 'max_depth': [None, 10, 20]}
grid_search = GridSearchCV(
    estimator=model,
    param_grid=param_grid,
    scoring='accuracy',
    cv=kf_inner,
)

# The grid search itself is the estimator being cross-validated by the outer loop.
cv_results = cross_val_score(grid_search, X, y, cv=kf_outer, scoring='accuracy')

print("Nested Cross-Validation Accuracy:", cv_results.mean())


In [None]:
from sklearn.model_selection import GroupKFold
from sklearn.model_selection import cross_val_score
from sklearn.linear_model import LogisticRegression

# Group K-fold cross-validation with five splits.
# X (features), y (labels) and groups (one group identifier per sample) are expected
# to be defined before this cell runs.
model = LogisticRegression()
gkf = GroupKFold(n_splits=5)

# groups is forwarded to the splitter through cross_val_score.
cv_results = cross_val_score(
    estimator=model,
    X=X,
    y=y,
    groups=groups,
    scoring='accuracy',
    cv=gkf,
)

print("Group K-Fold Cross-Validation Accuracy:", cv_results.mean())
