In [None]:
param_grid = {
    'learning_rate': [0.01, 0.1, 0.2],
    'max_depth': [3, 4, 5],
    'n_estimators': [100, 200, 300],
}

In [2]:
# Import necessary libraries
import pandas as pd
import numpy as np
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from xgboost import XGBClassifier

# Step 1: Load and Prepare the Iris Dataset
iris = load_iris()
X = iris.data  # Features
y = iris.target  # Target labels

# Step 2: Split the Data into Training and Testing Sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Step 3: Initialize and Configure the XGBoost Model
model = XGBClassifier(
    objective='multi:softmax',  # Multiclass classification
    num_class=3,                # Number of classes (Iris species)
    seed=42                     # Random seed for reproducibility
)

# Step 4: Train the XGBoost Model
model.fit(X_train, y_train)

# Step 5: Make Predictions on the Test Set
y_pred = model.predict(X_test)

# Step 6: Evaluate the Model
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy:.2f}")

# Step 7 (Optional): Feature Importance
importances = model.feature_importances_
feature_names = iris.feature_names
feature_importance_df = pd.DataFrame({'Feature': feature_names, 'Importance': importances})
print("Feature Importance:")
print(feature_importance_df)


Accuracy: 1.00
Feature Importance:
             Feature  Importance
0  sepal length (cm)    0.011077
1   sepal width (cm)    0.029049
2  petal length (cm)    0.752451
3   petal width (cm)    0.207423


In [3]:
# importances = model.feature_importances_

In [5]:
# Import necessary libraries
import pandas as pd
import numpy as np
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from xgboost import XGBClassifier

# Step 1: Load and Prepare the Iris Dataset
iris = load_iris()
X = iris.data  # Features
y = iris.target  # Target labels

# Step 2: Split the Data into Training and Testing Sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Step 3: Initialize and Configure the XGBoost Model
param_grid = {
    'learning_rate': [0.01, 0.1, 0.2],
    'max_depth': [3, 4, 5],
    'n_estimators': [100, 200, 300],
}
model = XGBClassifier(param_grid)

# Step 4: Train the XGBoost Model
model.fit(X_train, y_train)

# Step 5: Make Predictions on the Test Set
y_pred = model.predict(X_test)

# Step 6: Evaluate the Model
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy:.2f}")

# Step 7 (Optional): Feature Importance
importances = model.feature_importances_
feature_names = iris.feature_names
feature_importance_df = pd.DataFrame({'Feature': feature_names, 'Importance': importances})
print("Feature Importance:")
print(feature_importance_df)


Accuracy: 1.00
Feature Importance:
             Feature  Importance
0  sepal length (cm)    0.011077
1   sepal width (cm)    0.029049
2  petal length (cm)    0.752451
3   petal width (cm)    0.207423




In [19]:
# make_blobs.__dir__()

In [24]:
# from sklearn.datasets import load_iris, make_blobs
# iris = make_blobs(n_samples=100, n_features=2)
# print(iris)

In [29]:
# Import necessary libraries
import pandas as pd
import numpy as np
from sklearn.datasets import load_iris, make_blobs
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from xgboost import XGBClassifier

# Step 1: Load and Prepare the Iris Dataset
dataset = make_blobs(n_samples=10000, n_features=50, centers=3)
X = dataset[0]  # Features
y = dataset[1]  # Target labels

# Step 2: Split the Data into Training and Testing Sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Step 3: Initialize and Configure the XGBoost Model
param_grid = {
    'learning_rate': [0.01, 0.1, 0.2],
    'max_depth': [3, 4, 5],
    'n_estimators': [100, 200, 300],
}
model = XGBClassifier(param_grid)

# Step 4: Train the XGBoost Model
model.fit(X_train, y_train)

# Step 5: Make Predictions on the Test Set
y_pred = model.predict(X_test)

# Step 6: Evaluate the Model
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy:.2f}")

# Step 7 (Optional): Feature Importance
importances = model.feature_importances_
feature_names = ["feature 1", "feature 2"]
# feature_importance_df = pd.DataFrame({'Feature': feature_names, 'Importance': importances})
# print("Feature Importance:")
# print(feature_importance_df)


Accuracy: 1.00


In [33]:
# Import necessary libraries
import pandas as pd
import numpy as np
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from xgboost import XGBClassifier

# Step 1: Load and Prepare the Iris Dataset
dataset = pd.read_csv("diabetes.csv")
X = dataset.drop(columns="Outcome")  # Features
y = dataset.Outcome  # Target labels

# Step 2: Split the Data into Training and Testing Sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Step 3: Initialize and Configure the XGBoost Model
param_grid = {
    'learning_rate': [0.01, 0.1, 0.2],
    'max_depth': [3, 4, 5],
    'n_estimators': [100, 200, 300],
}
model = XGBClassifier()

# Step 4: Train the XGBoost Model
model.fit(X_train, y_train)

# Step 5: Make Predictions on the Test Set
y_pred = model.predict(X_test)

# Step 6: Evaluate the Model
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy:.2f}")

# Step 7 (Optional): Feature Importance
importances = model.feature_importances_
feature_names = X.columns
feature_importance_df = pd.DataFrame({'Feature': feature_names, 'Importance': importances})
print("Feature Importance:")
print(feature_importance_df)


Accuracy: 0.69

Feature Importance:
                    Feature  Importance
0               Pregnancies    0.072386
1                   Glucose    0.247188
2             BloodPressure    0.093273
3             SkinThickness    0.098815
4                   Insulin    0.115176
5                       BMI    0.143292
6  DiabetesPedigreeFunction    0.090128
7                       Age    0.139741


In [7]:
# Import necessary libraries
import pandas as pd
import numpy as np
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from xgboost import XGBClassifier

# Step 1: Load and Prepare the Iris Dataset
dataset = pd.read_csv("diabetes.csv")
X = dataset.drop(columns="Outcome")  # Features
y = dataset.Outcome  # Target labels

# Step 2: Split the Data into Training and Testing Sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Step 3: Initialize and Configure the XGBoost Model
param_grid = {
    'learning_rate': [0.01, 0.1, 0.2],
    'max_depth': [3, 4, 5],
    'n_estimators': [100, 200, 300],
}
model = XGBClassifier(n_estimators=100, learning_rate=0.4, max_depth=9)

# Step 4: Train the XGBoost Model
model.fit(X_train, y_train)

# Step 5: Make Predictions on the Test Set
y_pred = model.predict(X_test)

# Step 6: Evaluate the Model
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy:.2f}")

# Step 7 (Optional): Feature Importance
feature_importance_df = pd.DataFrame({'Feature': X.columns, 'Importance': model.feature_importances_})
print("Feature Importance:")
# print(feature_importance_df)
feature_importance_df

Accuracy: 0.71
Feature Importance:


Unnamed: 0,Feature,Importance
0,Pregnancies,0.091321
1,Glucose,0.256443
2,BloodPressure,0.09989
3,SkinThickness,0.084641
4,Insulin,0.115005
5,BMI,0.13126
6,DiabetesPedigreeFunction,0.092902
7,Age,0.128538


In [10]:
dataset.head(3)

Unnamed: 0,Pregnancies,Glucose,BloodPressure,SkinThickness,Insulin,BMI,DiabetesPedigreeFunction,Age,Outcome
0,6,148,72,35,0,33.6,0.627,50,1
1,1,85,66,29,0,26.6,0.351,31,0
2,8,183,64,0,0,23.3,0.672,32,1
