In [1]:
import warnings
warnings.filterwarnings('ignore')

import pandas as pd

# Transaction log: position i pairs one customer with one purchase amount
data = {
    'Customer_ID': [101, 102, 103, 101, 104, 102, 101, 105, 102, 103],
    'Purchase_Amount': [200, 150, 180, 220, 300, 200, 100, 400, 250, 300],
}
df = pd.DataFrame(data)

# Sum the purchase amounts of each customer; as_index=False keeps
# Customer_ID as an ordinary column beside the summed amounts
total_purchases = df.groupby('Customer_ID', as_index=False)['Purchase_Amount'].sum()

# Keep the three customers with the largest summed amount.
# NOTE(review): the ranking key is total spend, not the number of purchases,
# even though the printed heading says "Frequent" - confirm which is intended.
top_customers = (
    total_purchases
    .sort_values(by='Purchase_Amount', ascending=False)
    .iloc[:3]
)

# Each report is a heading line followed by the frame's text rendering
print("Total Purchases per Customer:", total_purchases, sep="\n")
print("\nTop 3 Frequent Customers:", top_customers, sep="\n")


Total Purchases per Customer:
   Customer_ID  Purchase_Amount
0          101              520
1          102              600
2          103              480
3          104              300
4          105              400

Top 3 Frequent Customers:
   Customer_ID  Purchase_Amount
1          102              600
0          101              520
2          103              480


In [2]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression

# Creating a DataFrame: house size in square feet and the matching sale price
data = {'Square_Feet': [1500, 2000, 2500, 3000, 3500],
        'Price': [300000, 400000, 500000, 600000, 700000]}

df = pd.DataFrame(data)

# Splitting into features and target.
# X stays a one-column DataFrame (double brackets) so the model records the
# feature name; y is the target Series.
X = df[['Square_Feet']]
y = df['Price']

# Training a Linear Regression Model on all five rows (no hold-out split is made)
model = LinearRegression()
model.fit(X, y)

# Predicting for test data.
# The raw sizes are wrapped in a DataFrame that reuses the training columns:
# the model was fitted with feature names, and predicting on a bare nested
# list makes scikit-learn emit a feature-name mismatch warning.
test_data = [[1800], [2800]]
test_features = pd.DataFrame(test_data, columns=X.columns)
predictions = model.predict(test_features)

print("Predicted Prices:")
print(predictions)

Predicted Prices:
[360000. 560000.]


In [3]:
import pandas as pd

# Creating a DataFrame: one row per observation, labelled with its category
data = {'Category': ['A', 'B', 'C', 'A', 'D', 'B', 'A', 'E', 'B', 'C', 'C', 'A'],
        'Value': [10, 15, 20, 30, 25, 18, 22, 40, 35, 50, 45, 15]}

df = pd.DataFrame(data)

# Counting occurrences per category: size() counts the rows in each group and
# reset_index(name='Count') turns the result into a two-column frame
category_counts = df.groupby('Category').size().reset_index(name='Count')

# Finding the top 3 most frequent categories.
# B and C are tied with 3 rows each; kind='stable' keeps tied rows in their
# existing (alphabetical, from groupby) order instead of relying on how the
# default sort algorithm happens to treat equal keys.
top_categories = (
    category_counts
    .sort_values(by='Count', ascending=False, kind='stable')
    .head(3)
)

# Printing results
print("Total Occurrences per Category:")
print(category_counts)
print("\nTop 3 Frequent Categories:")
print(top_categories)


Total Occurrences per Category:
  Category  Count
0        A      4
1        B      3
2        C      3
3        D      1
4        E      1

Top 3 Frequent Categories:
  Category  Count
0        A      4
1        B      3
2        C      3


In [4]:
import pandas as pd

# Creating a DataFrame; the None entries in 'Age' become NaN in a float column
data = {'Name': ['Alice', 'Bob', 'Charlie', 'David', 'Eve'],
        'Age': [25, 30, None, 35, None]}

df = pd.DataFrame(data)

# Display original data
print("Original Data:")
print(df)

# Replacing missing values with mean (mean() skips NaN, so it averages 25, 30, 35).
# The filled Series is assigned back to the column rather than calling
# fillna(inplace=True) on df['Age']: that chained in-place form operates on an
# intermediate object, raises a FutureWarning on pandas 2.x, and leaves df
# unchanged once Copy-on-Write is in effect.
df['Age'] = df['Age'].fillna(df['Age'].mean())

# Display updated data
print("\nData after Imputation:")
print(df)


Original Data:
      Name   Age
0    Alice  25.0
1      Bob  30.0
2  Charlie   NaN
3    David  35.0
4      Eve   NaN

Data after Imputation:
      Name   Age
0    Alice  25.0
1      Bob  30.0
2  Charlie  30.0
3    David  35.0
4      Eve  30.0


In [5]:
from sklearn.linear_model import LinearRegression

# Creating a DataFrame: years of experience and the matching salary
data = {'Experience': [1, 2, 3, 4, 5], 
        'Salary': [30000, 35000, 40000, 45000, 50000]}
df = pd.DataFrame(data)

# Splitting into X and y.
# X stays a one-column DataFrame (double brackets) so the model records the
# feature name; y is the target Series.
X = df[['Experience']]
y = df['Salary']

# Training a Linear Regression Model on all five rows
model = LinearRegression()
model.fit(X, y)

# Predicting salary for 6 years of experience.
# The query is passed as a DataFrame with the training column name: the model
# was fitted with feature names, and predicting on a bare nested list makes
# scikit-learn emit a feature-name mismatch warning.
query = pd.DataFrame({'Experience': [6]})
predicted_salary = model.predict(query)
print(f"Predicted Salary for 6 years of experience: ${predicted_salary[0]:.2f}")

Predicted Salary for 6 years of experience: $55000.00
