### Handling Unstructured Data with Python
**Description**: Extract structured data from unstructured text using Python.

**Steps**:
1. Load and analyze an unstructured text document.
2. Extract information using regex.

In [1]:
import re

# Step 1: Sample unstructured text (e.g., medical notes)
text = """
Patient John Doe, aged 45, visited on 2025-05-20 complaining of headache and fever.
Contact: 555-123-4567. Email: john.doe@example.com.
Next appointment: 2025-06-15.
"""

# Step 2: Extract structured data using regex

# Extract name (simple example: assume "Patient <Name>,")
name_match = re.search(r"Patient\s([A-Za-z\s]+),", text)
name = name_match.group(1) if name_match else "Not found"

# Extract age
age_match = re.search(r"aged\s(\d+)", text)
age = int(age_match.group(1)) if age_match else None

# Extract dates (YYYY-MM-DD)
dates = re.findall(r"\d{4}-\d{2}-\d{2}", text)

# Extract phone number (pattern: xxx-xxx-xxxx)
phone_match = re.search(r"\d{3}-\d{3}-\d{4}", text)
phone = phone_match.group(0) if phone_match else "Not found"

# Extract email
email_match = re.search(r"[\w\.-]+@[\w\.-]+", text)
email = email_match.group(0) if email_match else "Not found"

# Output extracted info
print("Extracted Information:")
print(f"Name: {name}")
print(f"Age: {age}")
print(f"Dates: {dates}")
print(f"Phone: {phone}")
print(f"Email: {email}")

Extracted Information:
Name: John Doe
Age: 45
Dates: ['2025-05-20', '2025-06-15']
Phone: 555-123-4567
Email: john.doe@example.com.
