# Introduction to Pandas 🐼


## Install and Import

```bash
pip install pandas
```

In [None]:
import pandas as pd

## Creating a Series

In [None]:
# A Series is a one-dimensional labelled array; building it from a plain
# list gives it the default integer index 0..n-1.
data = [10, 20, 30, 40]
series = pd.Series(data=data)
print(series)


## Creating a DataFrame

In [None]:
# Each dictionary key becomes a column name and each list becomes that
# column's values; all lists must have the same length.
data = {
    'Name': ['Alice', 'Bob', 'Charlie'],
    'Age': [25, 30, 35],
    'City': ['New York', 'Paris', 'London'],
}
df = pd.DataFrame(data=data)
print(df)


## Basic Operations

In [None]:
# Select a single column (returned as a Series).
name_column = df['Name']
print(name_column)

# Summary statistics for the DataFrame.
summary_stats = df.describe()
print(summary_stats)

# Boolean mask: keep only the rows whose Age is greater than 28.
older_than_28 = df['Age'] > 28
print(df[older_than_28])


## Reading and Writing Data

In [None]:
# Bare expression with no print(): presumably relies on the notebook showing
# the value of a cell's last expression (here, the DataFrame) as its output.
df

In [None]:
# Round-trip the DataFrame through a CSV file: write it out, then load the
# same file back into a second DataFrame.
csv_path = 'output.csv'
df.to_csv(csv_path, index=False)  # index=False: do not write the row index
df2 = pd.read_csv(csv_path)
print(df2)

## Handling Missing Data

In [None]:
# Count the missing values in each column.
print(df.isnull().sum())

# fillna and dropna are two alternative ways to deal with missing values.
# dropna is evaluated on the un-filled data: once every gap has been replaced
# by 0 there is nothing left for it to drop, so chaining it after fillna
# (as this cell used to) could never remove a row.
rows_without_missing = df.dropna()

# Replace any gaps with 0. Rebinding `df` instead of passing inplace=True
# leaves later cells with the same filled data as before, without mutating
# the original object.
df = df.fillna(0)


## Grouping and Aggregating

In [None]:
# Split the rows by City, take the Age column of each group, and reduce
# every group to its mean; the result is a Series indexed by City.
ages_by_city = df.groupby('City')['Age']
grouped = ages_by_city.mean()
print(grouped)


## Sorting Data

In [None]:
# Order the rows from highest to lowest Age. sort_values returns a new
# DataFrame, so `df` itself keeps its original row order.
sorted_df = df.sort_values(
    by='Age',
    ascending=False,
)
print(sorted_df)


## Visualization with Pandas

In [None]:
import matplotlib.pyplot as plt

# Small yearly sales table used for the plots below.
# NOTE: this rebinds `data` and `df`, replacing the values from earlier cells.
data = {
    'Year': [2020, 2021, 2022],
    'Sales': [100, 150, 200],
}
df = pd.DataFrame(data)

# Sales per year, drawn first as a line chart and then as a bar chart;
# each figure is shown before the next one is created.
for chart_kind in ('line', 'bar'):
    df.plot(x='Year', y='Sales', kind=chart_kind)
    plt.show()

# Histogram of the Sales values alone.
sales = df['Sales']
sales.plot(kind='hist')
plt.show()


## Pandas Cheat Sheet

| Task | Command |
|------|----------|
| Create DataFrame | pd.DataFrame(data) |
| Read CSV | pd.read_csv('file.csv') |
| Write CSV | df.to_csv('file.csv', index=False) |
| View Data | df.head(), df.tail() |
| Info | df.info(), df.describe() |
| Select Column | df['column'] |
| Filter Rows | df[df['Age'] > 30] |
| Group Data | df.groupby('column') |
| Sort Data | df.sort_values('column') |
| Check Missing | df.isnull() |
| Fill Missing | df.fillna(value) |
| Drop Missing | df.dropna() |
| Plot Data | df.plot(kind='line') |