# Pandas Data Processing Commands (SQL Equivalents)

This notebook lists pandas commands that correspond to common SQL operations.

## 1. Import Pandas

In [None]:
import pandas as pd

## 2. Read Data from CSV

In [None]:
# Load the contents of "input.csv" into the DataFrame `df`, which the
# following cells operate on.
df = pd.read_csv(filepath_or_buffer="input.csv")

## 3. Inspect Data

In [None]:
# Preview the first five rows of the frame.
df.head(n=5)

# Print a summary of the frame.
df.info()

## 4. Select Columns (SELECT)

In [None]:
# SELECT col1, col2: keep every row but only the two listed columns.
df.loc[:, ["col1", "col2"]]

## 5. Filter Rows (WHERE)

In [None]:
# WHERE col > 0: the comparison builds a boolean mask, and only rows where
# the mask is True are kept.
df.loc[df["col"] > 0]

## 6. Create Columns from Expressions

In [None]:
# SELECT col1 + col2 AS new_col: store the element-wise sum of the two
# columns in df under the name "new_col" (this modifies df in place).
df["new_col"] = df["col1"].add(df["col2"])

## 7. Rename Columns (AS)

In [None]:
# SELECT old_name AS new_name: rename one column and rebind `df` to the
# renamed result.
df = df.rename(mapper={"old_name": "new_name"}, axis="columns")

## 8. Sort Values (ORDER BY)

In [None]:
# ORDER BY col ASC: return the rows ordered by "col", smallest first.
# The result is not assigned, so `df` itself keeps its current order.
df.sort_values(by="col", ascending=True)

## 9. Distinct Values (DISTINCT)

In [None]:
# SELECT DISTINCT col: the values of one column with repeats removed
# (the first occurrence of each value is the one kept).
df.loc[:, "col"].drop_duplicates()

# SELECT DISTINCT *: whole rows with repeats removed, again keeping the
# first occurrence of each duplicated row.
df.drop_duplicates(keep="first")

## 10. Group and Aggregate (GROUP BY)

In [None]:
# SELECT key, SUM(value) ... GROUP BY key: one output row per distinct
# "key", holding the total of "value" for that group.
df.groupby(by="key").aggregate({"value": "sum"})

## 11. Filter Aggregated Data (HAVING)

In [None]:
# GROUP BY key with SUM(value): per-key totals of "value".
grouped = df.groupby(by="key")["value"].agg("sum")

# HAVING SUM(value) > 100: the filter is applied to the aggregated totals,
# not to the original rows.
filtered = grouped.loc[grouped > 100]

## 12. Join DataFrames (JOIN)

In [None]:
# INNER JOIN ... ON df1.key = df2.key: combine rows of the two frames that
# share a value in "key". df1 and df2 are placeholder frames; they are not
# created in the visible part of this notebook.
pd.merge(df1, df2, how="inner", on="key")

## 13. Union DataFrames (UNION)

In [None]:
# UNION ALL: stack the rows of df1 and df2 and keep duplicate rows.
# ignore_index=True renumbers the combined rows from 0.
pd.concat([df1, df2], ignore_index=True)

# UNION: SQL's plain UNION also removes duplicate rows, so de-duplicate
# after concatenating; ignore_index=True renumbers the surviving rows.
pd.concat([df1, df2]).drop_duplicates(ignore_index=True)

## 14. Limit Rows (LIMIT)

In [None]:
# LIMIT 10: take the first ten rows by position.
df.iloc[:10]

## 15. Handle Missing Values

In [None]:
# Replace every missing value with 0. The result is not assigned here,
# so `df` is left as it was.
df.fillna(value=0)

# Drop each row that contains at least one missing value. As above, the
# result is not assigned back to `df`.
df.dropna(axis=0, how="any")

## 16. Save to CSV

In [None]:
# Write the frame to "output.csv"; index=False leaves the row index out of
# the file.
df.to_csv(path_or_buf="output.csv", index=False)