# TrabalhoDatamining Sample Notebook

This notebook demonstrates a basic data mining workflow using pandas, scikit-learn, and matplotlib.

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score

## Load and Explore Data

In [None]:
# Load the Iris dataset that ships with scikit-learn and build a DataFrame:
# one column per entry in iris.feature_names, plus a 'target' column holding
# the class labels from iris.target.
iris = load_iris()
df = pd.DataFrame(
    data=iris.data,
    columns=iris.feature_names,
).assign(target=iris.target)

# Left as the final expression so the notebook renders a preview of the rows.
df.head()

## Visualize Data

In [None]:
# Scatter sepal length against sepal width, drawing one labelled series per
# entry of iris.target_names so each class gets its own legend entry.
plt.figure(figsize=(8, 6))
for i, target_name in enumerate(iris.target_names):
    # Select the rows of the current class once and reuse them for both axes.
    class_rows = df.loc[df['target'] == i]
    plt.scatter(
        class_rows['sepal length (cm)'],
        class_rows['sepal width (cm)'],
        label=target_name,
    )

# Decorate the figure; these calls are independent of one another.
plt.title('Iris Sepal Length vs Width')
plt.xlabel('Sepal length (cm)')
plt.ylabel('Sepal width (cm)')
plt.legend()
plt.show()

## Train/Test Split and Model Training

In [None]:
# Separate the feature columns from the class labels.
features = df[iris.feature_names]
labels = df['target']

# Hold out 20% of the rows for testing; the fixed random_state keeps the
# split the same from one run to the next.
X_train, X_test, y_train, y_test = train_test_split(
    features,
    labels,
    test_size=0.2,
    random_state=42,
)

# Fit a random forest with a fixed seed (fit() returns the estimator itself),
# then score its predictions on the held-out rows.
clf = RandomForestClassifier(random_state=42).fit(X_train, y_train)
y_pred = clf.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print('Accuracy:', accuracy)