# NumPy vs Python Lists: Performance & Usage Guide
This notebook compares **Python lists** with **NumPy arrays**: it benchmarks their speed, compares their memory usage, and walks through common array operations.

## 1. Python Lists vs NumPy Arrays (Performance Benchmark)

In [None]:
import numpy as np
import time

# Benchmark: element-wise addition of two sequences of one million integers,
# first with plain Python lists, then with NumPy arrays.
size = 1_000_000
list1 = list(range(size))
list2 = list(range(size))

# time.perf_counter() is used instead of time.time(): it is monotonic and uses
# the highest-resolution clock available, so short intervals are measured
# reliably and are not affected by system clock adjustments.
start = time.perf_counter()
list_result = [x + y for x, y in zip(list1, list2)]
list_elapsed = time.perf_counter() - start
print("Python list addition time:", list_elapsed)

# The list -> array conversion happens outside the timed region so that only
# the addition itself is measured.
arr1 = np.array(list1)
arr2 = np.array(list2)

start = time.perf_counter()
result = arr1 + arr2  # Vectorized operation: the loop runs in compiled code
numpy_elapsed = time.perf_counter() - start
print("NumPy array addition time:", numpy_elapsed)

## 2. Creating NumPy Arrays

In [None]:
import numpy as np

# Source data: a flat list becomes a 1D array, a list of equal-length
# lists becomes a 2D array.
values_1d = [1, 2, 3, 4, 5]
values_2d = [[1, 2, 3], [4, 5, 6]]

arr1 = np.array(values_1d)
arr2 = np.array(values_2d)

# Show the 1D array first, then the 2D one.
for created in (arr1, arr2):
    print(created)

# Every NumPy array is an ndarray; .shape reports (rows, columns) for 2D data.
print(f"Type: {type(arr1)}")
print(f"Shape: {arr2.shape}")

## 3. Memory Efficiency

In [None]:
import sys

# Compare the memory footprint of 1000 integers stored as a Python list
# versus a NumPy array.
list_data = list(range(1000))
numpy_data = np.array(list_data)

# sys.getsizeof(list_data) only counts the list object itself (its header and
# its array of references), not the int objects it refers to. The total is
# therefore the container size plus the size of every element object.
# Multiplying the container size by the element count would overstate the
# footprint by orders of magnitude.
list_bytes = sys.getsizeof(list_data) + sum(sys.getsizeof(item) for item in list_data)

print("Python list size:", list_bytes, "bytes")
# .nbytes is the size of the array's element buffer (itemsize * number of elements).
print("NumPy array size:", numpy_data.nbytes, "bytes")

## 4. Array Basics (Shape, Size, Dimensions, Data types)

In [None]:
# Common array constructors. Each result is bound to a name and printed:
# a notebook cell only displays its *last* bare expression, so unassigned
# calls in the middle of a cell would be computed and silently discarded.
zeros_3x3 = np.zeros((3, 3))          # 3x3 array of 0.0
ones_2x4 = np.ones((2, 4))            # 2x4 array of 1.0
sevens_2x2 = np.full((2, 2), 7)       # 2x2 array filled with the constant 7
identity_4 = np.eye(4)                # 4x4 identity matrix
odd_numbers = np.arange(1, 10, 2)     # 1, 3, 5, 7, 9 (stop value is exclusive)
even_spacing = np.linspace(0, 1, 5)   # 5 evenly spaced points, endpoints included

for label, created in [
    ("np.zeros((3, 3))", zeros_3x3),
    ("np.ones((2, 4))", ones_2x4),
    ("np.full((2, 2), 7)", sevens_2x2),
    ("np.eye(4)", identity_4),
    ("np.arange(1, 10, 2)", odd_numbers),
    ("np.linspace(0, 1, 5)", even_spacing),
]:
    print(label)
    print(created)

# Basic attributes of a 2x3 integer array.
arr = np.array([[10, 20, 30], [40, 50, 60]])
print("Shape:", arr.shape)      # length along each axis
print("Size:", arr.size)        # total number of elements
print("Dimensions:", arr.ndim)  # number of axes
print("Data type:", arr.dtype)  # element type shared by all entries

## 5. Reshaping & Flattening

In [None]:
# Start from a matrix with 2 rows and 3 columns.
arr = np.array([[1, 2, 3], [4, 5, 6]])
print(np.shape(arr))

# Rearrange the same six values into 3 rows and 2 columns.
reshaped = np.reshape(arr, (3, 2))
print(reshaped)

# Collapse the matrix into a one-dimensional copy.
flattened = arr.flatten()
print(flattened)

## 6. Indexing, Slicing, Masking, and Fancy Indexing

In [None]:
arr = np.array([10, 20, 30, 40, 50])

# Three basic slices: items 1..3, the first three items, every second item.
for window in (slice(1, 4), slice(None, 3), slice(None, None, 2)):
    print(arr[window])

# A basic slice is a view onto the original data, so writing through
# `sliced` also changes `arr` (element 1 becomes 999).
sliced = arr[1:4]
sliced[0] = 999
print(arr)

# Fancy indexing: pick arbitrary positions with a list of indices.
idx = [0, 2, 4]
picked = arr[idx]
print(picked)

# Boolean masking: keep only the elements where the condition holds.
mask = arr > 25
print(arr[mask])

## 7. Operations (Vectorization & Broadcasting)

In [None]:
# Vectorization: arithmetic operators apply to every element at once.
arr = np.array([1, 2, 3, 4, 5])
squared = arr ** 2
shifted = arr + 10
print(squared)
print(shifted)

# Broadcasting: the length-3 vector is added to each row of the 2x3 matrix.
arr1 = np.array([[1, 2, 3], [4, 5, 6]])
arr2 = np.array([1, 2, 3])
row_wise_sum = arr1 + arr2
print(row_wise_sum)

## 8. Statistics & Normalization

In [None]:
# Five observations (rows) of three features (columns).
data = np.array([
    [10, 20, 30],
    [15, 25, 35],
    [20, 30, 40],
    [25, 35, 45],
    [30, 40, 50],
])

# Per-column statistics: axis=0 aggregates down the rows.
mean = np.mean(data, axis=0)
std = np.std(data, axis=0)

# Z-score normalization: centre each column on 0, then scale it to unit
# standard deviation. Broadcasting applies the per-column values to every row.
centered = data - mean
normalized_data = centered / std
print(normalized_data)

## 9. Useful NumPy Functions Cheat-Sheet

In [None]:
# Inputs are defined here so the cell runs on a fresh kernel instead of relying
# on variables left over from an earlier section. The values match the ones
# used in the vectorization & broadcasting section.
arr = np.array([1, 2, 3, 4, 5])
arr1 = np.array([[1, 2, 3], [4, 5, 6]])
arr2 = np.array([1, 2, 3])

# Every result is collected and printed with a label: a notebook cell only
# displays its last bare expression, so unassigned calls would be discarded.
cheat_sheet = {
    "mean": np.mean(arr),                      # arithmetic mean
    "std": np.std(arr),                        # standard deviation
    "var": np.var(arr),                        # variance
    "min": np.min(arr),                        # smallest element
    "max": np.max(arr),                        # largest element
    "sum": np.sum(arr),                        # sum of all elements
    "prod": np.prod(arr),                      # product of all elements
    "median": np.median(arr),                  # middle value
    "percentile(arr, 50)": np.percentile(arr, 50),  # 50th percentile
    "argmin": np.argmin(arr),                  # index of the smallest element
    "argmax": np.argmax(arr),                  # index of the largest element
    # Rows are treated as variables: the two rows of arr1 plus arr2 give a 3x3 matrix.
    "corrcoef(arr1, arr2)": np.corrcoef(arr1, arr2),
    "unique": np.unique(arr),                  # sorted distinct values
    "diff": np.diff(arr),                      # differences between neighbours
    "cumsum": np.cumsum(arr),                  # running total
    "linspace(0, 10, 5)": np.linspace(0, 10, 5),  # 5 evenly spaced points in [0, 10]
    "log": np.log(arr),                        # natural logarithm, element-wise
    "exp": np.exp(arr),                        # e ** x, element-wise
}

for name, value in cheat_sheet.items():
    print(f"np.{name}:", value)

# ✅ Conclusion
- Python lists are **slower** and use more memory for numerical operations.
- NumPy arrays are **faster, memory-efficient, and support vectorized & broadcasting operations**.
- NumPy provides a rich set of tools for data analysis, statistics, and machine learning preparation.