In [None]:
import numpy as np

file_path = '/content/supermarket_sales.csv'
data = np.genfromtxt(file_path, delimiter=',', dtype=str, skip_header=1)

In [7]:
product_categories = data[:, 5]
unit_prices = data[:, 6].astype(float)
quantities = data[:, 7].astype(int)
total_sales = data[:, 9].astype(float)
gross_incomes = data[:, 15].astype(float)

print("--- Data Loading Complete ---")
print(f"Total records loaded: {len(data)}\n")

--- Data Loading Complete ---
Total records loaded: 1000



In [8]:
overall_total_sales = np.sum(total_sales)
average_sales = np.mean(total_sales)

print("--- Array Operations ---")
print(f"Overall Total Sales: ${overall_total_sales:.2f}")
print(f"Average Sale Amount: ${average_sales:.2f}\n")

--- Array Operations ---
Overall Total Sales: $322966.75
Average Sale Amount: $322.97



In [11]:
print("--- Indexing and Slicing ---")
# Slicing the first 5 records
print(f"First 5 Product Categories: {product_categories[:5]}")
print(f"First 5 Quantities Sold: {quantities[:5]}")
high_volume_mask = quantities >= 8
high_volume_sales = total_sales[high_volume_mask]
print(f"Number of transactions where 8 or more items were sold: {len(high_volume_sales)}\n")

--- Indexing and Slicing ---
First 5 Product Categories: ['Health and beauty' 'Electronic accessories' 'Home and lifestyle'
 'Health and beauty' 'Sports and travel']
First 5 Quantities Sold: [7 5 7 8 7]
Number of transactions where 8 or more items were sold: 296



In [10]:
print("--- Statistical Operations on Gross Income ---")
print(f"Mean Gross Income: ${np.mean(gross_incomes):.2f}")
print(f"Median Gross Income: ${np.median(gross_incomes):.2f}")
print(f"Variance of Gross Income: ${np.var(gross_incomes):.2f}")
print(f"Standard Deviation of Gross Income: ${np.std(gross_incomes):.2f}\n")

--- Statistical Operations on Gross Income ---
Mean Gross Income: $15.38
Median Gross Income: $12.09
Variance of Gross Income: $136.96
Standard Deviation of Gross Income: $11.70



In [12]:
calculated_revenue = quantities * unit_prices

print("--- Broadcasting & Vectorized Computation ---")
print("Calculated Revenue (Quantity * Unit Price) for the first 5 transactions:")
print(calculated_revenue[:5])
print("\nComparing calculated revenue to recorded 'Total' for the first transaction:")
print(f"Calculated: ${calculated_revenue[0]:.2f}")
print(f"Recorded Total (Includes Tax): ${total_sales[0]:.2f}\n")

--- Broadcasting & Vectorized Computation ---
Calculated Revenue (Quantity * Unit Price) for the first 5 transactions:
[522.83  76.4  324.31 465.76 604.17]

Comparing calculated revenue to recorded 'Total' for the first transaction:
Calculated: $522.83
Recorded Total (Includes Tax): $548.97



In [13]:
print("--- Interpretation of Statistical Results ---")
print(f"1. Central Tendency: The average transaction generates roughly ${np.mean(total_sales):.2f} in total sales, and the median gross income is ${np.median(gross_incomes):.2f}, showing a baseline for expected profitability per transaction.")
print(f"2. Dispersion: The standard deviation of gross income is ${np.std(gross_incomes):.2f}. This relatively low standard deviation suggests that the profit margins per transaction are quite consistent across the dataset.")
print("3. Business Impact: Using vectorized multiplication reveals the pre-tax base revenue efficiently, demonstrating how NumPy scales calculations across thousands of rows instantly.")

--- Interpretation of Statistical Results ---
1. Central Tendency: The average transaction generates roughly $322.97 in total sales, and the median gross income is $12.09, showing a baseline for expected profitability per transaction.
2. Dispersion: The standard deviation of gross income is $11.70. This relatively low standard deviation suggests that the profit margins per transaction are quite consistent across the dataset.
3. Business Impact: Using vectorized multiplication reveals the pre-tax base revenue efficiently, demonstrating how NumPy scales calculations across thousands of rows instantly.
