In [None]:
# Import necessary libraries
import numpy as np
import pandas as pd
import json
import xml.etree.ElementTree as ET
import sqlite3
import os

print("Libraries imported successfully!")


In [None]:
# Sample employee records (header row + five data rows) used to demonstrate
# CSV extraction with pandas.
csv_data = '''id,name,age,city,salary
1,John Smith,34,New York,75000
2,Sarah Johnson,28,San Francisco,82000
3,Michael Brown,45,Chicago,65000
4,Emily Davis,31,Boston,78000
5,Robert Wilson,39,Seattle,90000
'''

# Write the sample to disk. The encoding is pinned to UTF-8 so the bytes on
# disk do not depend on the platform's locale default; pd.read_csv decodes as
# UTF-8 unless told otherwise, so writer and reader now always agree.
with open('sample_data.csv', 'w', encoding='utf-8') as f:
    f.write(csv_data)

# Read the file back into a DataFrame (encoding stated explicitly to mirror
# the writer above).
df_csv = pd.read_csv('sample_data.csv', encoding='utf-8')

# Preview of the rows, the inferred column dtypes, and summary statistics of
# the numeric columns.
print("CSV Data:")
print(df_csv.head())
print("\nData Types:")
print(df_csv.dtypes)
print("\nBasic Statistics:")
print(df_csv.describe())


In [None]:
# Nested sample payload: two employee records (each with a nested "details"
# object and a list of projects) plus a top-level company name.
json_data = dict(
    employees=[
        dict(
            id=1,
            name="John Smith",
            details=dict(
                age=34,
                position="Software Engineer",
                department="Engineering",
                skills=["Python", "JavaScript", "Docker"],
            ),
            projects=[
                dict(name="Project A", status="Completed"),
                dict(name="Project B", status="In Progress"),
            ],
        ),
        dict(
            id=2,
            name="Sarah Johnson",
            details=dict(
                age=28,
                position="Data Scientist",
                department="Analytics",
                skills=["Python", "R", "SQL", "Machine Learning"],
            ),
            projects=[
                dict(name="Project C", status="In Progress"),
            ],
        ),
    ],
    company="Tech Solutions Inc.",
)

# Serialize the payload (4-space indentation) and store it on disk.
with open('sample_data.json', 'w') as json_out:
    json_out.write(json.dumps(json_data, indent=4))

# Load the file back and decode it into Python objects.
with open('sample_data.json', 'r') as json_in:
    loaded_json = json.loads(json_in.read())

print("JSON Data Structure:")
print(json.dumps(loaded_json, indent=2))

# Flatten the employee records into a table; keys of the nested "details"
# object become dotted column names, while list values stay as lists.
employees = pd.json_normalize(loaded_json['employees'])
print("\nEmployees DataFrame:")
print(employees)


In [None]:
# Sample XML document: a <bookstore> root holding three <book> elements, each
# with a "category" attribute and title/author/year/price child elements.
xml_data = '''<?xml version="1.0" encoding="UTF-8"?>
<bookstore>
  <book category="Fiction">
    <title>The Great Gatsby</title>
    <author>F. Scott Fitzgerald</author>
    <year>1925</year>
    <price>12.99</price>
  </book>
  <book category="Non-Fiction">
    <title>Sapiens: A Brief History of Humankind</title>
    <author>Yuval Noah Harari</author>
    <year>2011</year>
    <price>15.95</price>
  </book>
  <book category="Science Fiction">
    <title>Dune</title>
    <author>Frank Herbert</author>
    <year>1965</year>
    <price>10.50</price>
  </book>
</bookstore>
'''

# Write the document to disk. The XML declaration promises UTF-8, so the file
# must actually be encoded as UTF-8 rather than the platform's locale default;
# otherwise non-ASCII text would be mis-decoded (or rejected) by the parser.
with open('sample_data.xml', 'w', encoding='utf-8') as f:
    f.write(xml_data)

# Parse the file and grab the <bookstore> root element.
tree = ET.parse('sample_data.xml')
root = tree.getroot()

# Child elements copied into each record, in output column order.
book_fields = ('title', 'author', 'year', 'price')

# Build one dict per <book>. findtext() returns the child's text, or the
# given default when the child is missing, so each field needs only a single
# lookup. Values are kept as strings exactly as they appear in the document.
books = []
for book in root.findall('book'):
    book_data = {'category': book.attrib.get('category', '')}
    book_data.update(
        {field: book.findtext(field, default='') for field in book_fields}
    )
    books.append(book_data)

# Convert the list of records to a DataFrame (one row per book).
df_xml = pd.DataFrame(books)
print("XML Data as DataFrame:")
print(df_xml)


In [None]:
# Sample rows to load: (id, name, department, salary, hire_date).
employees_data = [
    (1, 'John Smith', 'Engineering', 75000.00, '2020-03-15'),
    (2, 'Sarah Johnson', 'Analytics', 82000.00, '2019-11-10'),
    (3, 'Michael Brown', 'Marketing', 65000.00, '2018-06-22'),
    (4, 'Emily Davis', 'Engineering', 78000.00, '2021-01-05'),
    (5, 'Robert Wilson', 'Analytics', 90000.00, '2017-09-30')
]

# Open (or create) the SQLite database file. Everything that touches the
# connection runs inside try/finally so the connection is closed even when a
# statement raises, instead of leaking an open handle on the database file.
conn = sqlite3.connect('sample_database.db')
try:
    cursor = conn.cursor()

    # Create the table on first run; IF NOT EXISTS keeps the cell re-runnable.
    cursor.execute('''
CREATE TABLE IF NOT EXISTS employees (
    id INTEGER PRIMARY KEY,
    name TEXT NOT NULL,
    department TEXT NOT NULL,
    salary REAL,
    hire_date TEXT
)
''')

    # INSERT OR REPLACE keyed on the primary key, so re-running the cell
    # overwrites the sample rows rather than failing on duplicate ids.
    cursor.executemany('''
INSERT OR REPLACE INTO employees (id, name, department, salary, hire_date)
VALUES (?, ?, ?, ?, ?)
''', employees_data)

    # Commit changes
    conn.commit()

    # Query data
    cursor.execute('SELECT * FROM employees')
    rows = cursor.fetchall()

    # Take the column names from the cursor metadata rather than hard-coding
    # them, so the DataFrame header always matches what SELECT * returned.
    column_names = [column[0] for column in cursor.description]

    # Convert to DataFrame
    df_sql = pd.DataFrame(rows, columns=column_names)
finally:
    # Close connection
    conn.close()

print("Database Query Results:")
print(df_sql)


In [None]:
# Reference-only snippet: the triple-quoted string below is a bare expression
# statement, so none of the code inside it is executed. It sketches GET, POST
# and token-authenticated calls with the `requests` library, which the
# notebook's import cell does not import. The URLs and "YOUR_API_TOKEN" are
# placeholders, not real endpoints or credentials.
'''
# Example of API data extraction using requests library
import requests

# GET request to an API
response = requests.get("https://api.example.com/data")

# Check if request was successful
if response.status_code == 200:
    # Parse JSON response
    data = response.json()
    
    # Convert to DataFrame
    df = pd.DataFrame(data)
    
    # Process and analyze data
    # ...

# POST request with parameters
params = {
    "key1": "value1",
    "key2": "value2"
}
response = requests.post("https://api.example.com/submit", json=params)

# Authentication example
headers = {
    "Authorization": "Bearer YOUR_API_TOKEN"
}
response = requests.get("https://api.example.com/protected", headers=headers)
'''

# Confirmation message only; no request has been made at this point.
print("API extraction code examples ready for reference!")

# Stand-in for a paginated API payload, built locally so the notebook needs
# no network access. Each tuple is one product: (id, name, category, price).
product_fields = ("id", "name", "category", "price")
product_rows = [
    (1, "Product A", "Electronics", 499.99),
    (2, "Product B", "Clothing", 29.99),
    (3, "Product C", "Home", 149.99),
    (4, "Product D", "Electronics", 999.99),
    (5, "Product E", "Clothing", 59.99),
]

simulated_api_response = {
    # Pair every value with its field name to form the per-product records.
    "results": [dict(zip(product_fields, row)) for row in product_rows],
    "total": 5,
    "page": 1,
    "pages": 1,
}

# Only the "results" list is tabular; the paging metadata is left out of the
# DataFrame.
df_api = pd.DataFrame(simulated_api_response["results"])
print("Simulated API Data:", df_api, sep="\n")
