In [1]:
import pandas as pd
import numpy as np

# Step 1: Assemble the people table from a column-oriented dictionary
data = {
    "First Name": ["Alice", "Bob", "Charlie", "David"],
    "Age": [25, 30, 35, 40],
    "City": ["New York", "San Francisco", "Los Angeles", "Chicago"],
}


def _to_snake_case(label):
    """Lower-case a column label and swap its spaces for underscores."""
    return label.lower().replace(" ", "_")


# 1. Normalise the column labels; rename() returns a new frame, so bind it to df
df = pd.DataFrame(data).rename(columns=_to_snake_case)

# 2. Preview the top three records
print("First 3 rows of the DataFrame:")
print(df.iloc[:3])

# 3. Average of the 'age' column
mean_age = df.loc[:, "age"].mean()
print("\nMean age of the individuals:", mean_age)

# 4. Project the frame down to the name and city columns only
print("\nSelected columns (first_name and city):")
print(df.loc[:, ["first_name", "city"]])

# 5. Attach a 'salary' column of pseudo-random integers, one per row.
#    Seeding the global NumPy generator first makes the draw repeatable.
np.random.seed(42)
df = df.assign(salary=np.random.randint(low=50000, high=100000, size=df.shape[0]))

# 6. Descriptive statistics for the numeric columns (age and salary)
print("\nSummary statistics of the DataFrame:")
print(df.describe())

First 3 rows of the DataFrame:
  first_name  age           city
0      Alice   25       New York
1        Bob   30  San Francisco
2    Charlie   35    Los Angeles

Mean age of the individuals: 32.5

Selected columns (first_name and city):
  first_name           city
0      Alice       New York
1        Bob  San Francisco
2    Charlie    Los Angeles
3      David        Chicago

Summary statistics of the DataFrame:
             age        salary
count   4.000000      4.000000
mean   32.500000  74886.250000
std     6.454972  20247.671938
min    25.000000  50860.000000
25%    28.750000  62061.250000
50%    32.500000  76976.500000
75%    36.250000  89801.500000
max    40.000000  94732.000000


In [2]:
import pandas as pd

# Step 1: Load the monthly figures into a DataFrame
data = {
    "Month": ["Jan", "Feb", "Mar", "Apr"],
    "Sales": [5000, 6000, 7500, 8000],
    "Expenses": [3000, 3500, 4000, 4500],
}
sales_and_expenses = pd.DataFrame(data)

# Pull out the two numeric columns once; every statistic below reads from them
sales_column = sales_and_expenses.loc[:, "Sales"]
expenses_column = sales_and_expenses.loc[:, "Expenses"]

# Step 2: Largest value in each column
max_sales, max_expenses = sales_column.max(), expenses_column.max()
print("Maximum Sales:", max_sales)
print("Maximum Expenses:", max_expenses)

# Step 3: Smallest value in each column
min_sales, min_expenses = sales_column.min(), expenses_column.min()
print("\nMinimum Sales:", min_sales)
print("Minimum Expenses:", min_expenses)

# Step 4: Arithmetic mean of each column
avg_sales, avg_expenses = sales_column.mean(), expenses_column.mean()
print("\nAverage Sales:", avg_sales)
print("Average Expenses:", avg_expenses)

Maximum Sales: 8000
Maximum Expenses: 4500

Minimum Sales: 5000
Minimum Expenses: 3000

Average Sales: 6625.0
Average Expenses: 3750.0


In [3]:
import pandas as pd

# Step 1: Build the expense table, one row per category and one column per month
data = {
    "Category": ["Rent", "Utilities", "Groceries", "Entertainment"],
    "January": [1200, 200, 300, 150],
    "February": [1300, 220, 320, 160],
    "March": [1400, 240, 330, 170],
    "April": [1500, 250, 350, 180],
}

# Use 'Category' as the row index so only the month columns hold values
expenses = pd.DataFrame(data).set_index("Category")

# Step 2: Highest monthly figure per category (reduce across the month columns)
max_expenses = expenses.max(axis="columns")
print("Maximum expense for each category:")
print(max_expenses)

# Step 3: Lowest monthly figure per category
min_expenses = expenses.min(axis="columns")
print("\nMinimum expense for each category:")
print(min_expenses)

# Step 4: Mean monthly figure per category
avg_expenses = expenses.mean(axis="columns")
print("\nAverage expense for each category:")
print(avg_expenses)

Maximum expense for each category:
Category
Rent             1500
Utilities         250
Groceries         350
Entertainment     180
dtype: int64

Minimum expense for each category:
Category
Rent             1200
Utilities         200
Groceries         300
Entertainment     150
dtype: int64

Average expense for each category:
Category
Rent             1350.0
Utilities         227.5
Groceries         325.0
Entertainment     165.0
dtype: float64
