# 🧪 AutoML Exploration in Databricks
This notebook demonstrates how to load a training dataset from a Delta table, explore it with pandas and seaborn, and run an AutoML classification experiment inside Databricks using Python.

In [None]:
# Import necessary libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Databricks notebooks normally expose a ready-made SparkSession named `spark`,
# so no session is created here.
# Read the training data stored in Delta format at the mounted path.
df = spark.read.load("/mnt/delta/training_data", format="delta")

# Preview the first 5 rows.
df.show(5)

In [None]:
# Convert Spark DataFrame to Pandas for visualization.
# toPandas() collects every requested row onto the driver, so the number of
# rows pulled is capped. One extra row is fetched purely to detect whether
# the cap was hit, which avoids a separate full count() pass over the table.
MAX_PANDAS_ROWS = 100_000  # raise this if the driver has memory to spare
pdf = df.limit(MAX_PANDAS_ROWS + 1).toPandas()
if len(pdf) > MAX_PANDAS_ROWS:
    # Drop the sentinel row and tell the reader the EDA below is on a subset.
    pdf = pdf.iloc[:MAX_PANDAS_ROWS]
    print(f"Note: EDA below uses a {MAX_PANDAS_ROWS:,}-row subset of the dataset.")

# Basic EDA: summary statistics (last expression, so the notebook renders it)
pdf.describe()

In [None]:
# Correlation heatmap of the numeric columns in the pandas copy of the data.
corr_matrix = pdf.corr(numeric_only=True)

# Draw on an explicit figure/axes pair rather than the implicit pyplot state.
fig, ax = plt.subplots(figsize=(10, 6))
sns.heatmap(corr_matrix, annot=True, cmap='coolwarm', ax=ax)
ax.set_title("Feature Correlation Heatmap")
plt.show()

## 🚀 Launching AutoML

In [None]:
import databricks.automl

# Settings for the AutoML classification run: the label column name and the
# timeout (in minutes) handed to AutoML.
automl_settings = {
    "target_col": 'target',
    "timeout_minutes": 15,
}

# Launch AutoML on the Spark DataFrame (not the pandas copy).
summary = databricks.automl.classify(df, **automl_settings)

# Show the best trial from the returned summary as the cell output.
summary.best_trial