<a href="https://colab.research.google.com/github/Prashasticodes/Cancer-Regression-/blob/main/Copy_of_breast_Cancer_prediction_(1).ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
# Import necessary libraries
import pandas as pd
from sklearn.datasets import load_breast_cancer
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestRegressor
from sklearn.metrics import mean_squared_error, r2_score

# Step 1: Load the dataset
cancer_data = load_breast_cancer()
data = pd.DataFrame(data=cancer_data.data, columns=cancer_data.feature_names)

# Note: the dataset does not contain a continuous regression target. The only
# label it provides is a binary class code (0 or 1; cancer_data.target_names
# gives the meaning of each code). This notebook fits a regressor directly to
# that 0/1 label, so every prediction is a score between 0 and 1 that can be
# thresholded into a class.
data['target'] = cancer_data.target

# Step 2: Feature selection
# Drop the label by name instead of by position, so the selection does not
# silently depend on 'target' being the last column of `data`.
features = data.columns.drop('target')
X = data[features]  # Features
y = data['target']  # Target variable (0/1 class label)

# Step 3: Data splitting
# Fixed random_state keeps the 80/20 split reproducible across runs.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Step 4: Model training
model = RandomForestRegressor(n_estimators=100, random_state=42)
model.fit(X_train, y_train)

# Step 5: Predictions
# y_pred holds continuous scores, not hard class labels.
y_pred = model.predict(X_test)

# Step 6: Model evaluation
# Regression-style metrics, computed on the raw scores against the 0/1 labels.
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

# Output evaluation metrics
print(f'Mean Squared Error: {mse}')
print(f'R-squared: {r2}')

# Calculate accuracy percentage
# R-squared is NOT an accuracy: it measures explained variance and can even be
# negative. A real accuracy needs hard class labels, so threshold the scores
# at 0.5 and report the share of test samples whose class matches the label.
y_pred_class = (y_pred >= 0.5).astype(int)
accuracy_percentage = (y_pred_class == y_test.to_numpy()).mean() * 100
print(f'Accuracy Percentage: {accuracy_percentage:.2f}%')

# Optional: Feature Importance
# feature_importances_ is ordered like the training columns, i.e. like `features`.
importances = model.feature_importances_
feature_importance_df = pd.DataFrame({'feature': features, 'importance': importances})
print("\nFeature Importances:")
print(feature_importance_df.sort_values(by='importance', ascending=False))



Mean Squared Error: 0.03276140350877193
R-squared: 0.8605413691451032
Accuracy Percentage: 86.05%

Feature Importances:
                    feature  importance
27     worst concave points    0.269936
7       mean concave points    0.202781
22          worst perimeter    0.158947
23               worst area    0.118171
20             worst radius    0.103470
21            worst texture    0.025475
1              mean texture    0.021067
26          worst concavity    0.011771
13               area error    0.010239
24         worst smoothness    0.008456
4           mean smoothness    0.006652
16          concavity error    0.006587
19  fractal dimension error    0.005278
3                 mean area    0.005143
6            mean concavity    0.004656
28           worst symmetry    0.004215
12          perimeter error    0.003913
11            texture error    0.003764
10             radius error    0.003696
18           symmetry error    0.003541
14         smoothness error    0.003475
