In [None]:
# Install numpy, pandas and matplotlib with the %pip magic, one package per line.
# NOTE(review): no versions are pinned here, so the installed releases depend on when this cell runs.
%pip install numpy
%pip install pandas
%pip install matplotlib

### Step 1: Loading Data with pandas

Først vil vi indlæse vores datasæt ved hjælp af pandas, som giver en effektiv og intuitiv ramme til håndtering af tabulære data.

In [None]:
import pandas as pd

# Read the sales dataset from the CSV file into a DataFrame
data = pd.read_csv(filepath_or_buffer='sales_data.csv')
# Print the loaded table so it can be inspected
print(data)

### Step 2: Data Analysis with pandas

Herefter vil vi udføre nogle grundlæggende dataanalyser, såsom at beregne det samlede salg og gennemsnitsprisen.

In [29]:
# Compute each product's total sales as unit price times units sold and
# store it on `data` as a new 'Total Sales' column.
data['Total Sales'] = data['Price'] * data['Units Sold']
# sep="\n" places the table on its own line. Embedding "\n" in the label and
# relying on print's default " " separator would prepend a space to the
# table's header row, shifting it out of line with the data rows.
print("Total sales for each product:", data[['Product', 'Total Sales']], sep="\n")

# Compute the mean of the 'Price' column across all rows
average_price = data['Price'].mean()
print("Average price of products:", average_price)


Total sales for each product:
      Product  Total Sales
0  Product A          300
1  Product B         1200
2  Product C         1350
3  Product D         1000
Average price of products: 35.0


### Step 3: Visualization with Matplotlib

Endelig vil vi visualisere disse data ved hjælp af Matplotlib for at vise salget og antallet af solgte enheder.

In [None]:
import matplotlib.pyplot as plt

# Bar chart: one bar per product, bar height is the product's total sales
fig_sales, ax_sales = plt.subplots(figsize=(10, 5))
ax_sales.bar(data['Product'], data['Total Sales'], color='blue')
ax_sales.set_title('Total Sales per Product')
ax_sales.set_xlabel('Product')
ax_sales.set_ylabel('Total Sales')
plt.show()

# Pie chart: each product's share of the units sold, labelled with a
# one-decimal percentage
fig_units, ax_units = plt.subplots(figsize=(7, 7))
ax_units.pie(data['Units Sold'], labels=data['Product'], autopct='%1.1f%%')
ax_units.set_title('Percentage of Units Sold by Product')
plt.show()


### Step 4: Sammenligning af Salg og Units Sold med Stacked Bar Chart
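Dette eksempel kombinerer oplysninger om salg og antal solgte enheder i ét stablet søjlediagram. Bemærk, at de to størrelser har forskellige enheder (antal og beløb), så søjlernes samlede højde skal ikke aflæses som en meningsfuld sum.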

In [None]:
# (Re)assign the 'Total Sales' column as unit price times units sold
data['Total Sales'] = data['Price'] * data['Units Sold']

# Stacked bar chart: the units-sold bars form the base layer and the
# total-sales bars are drawn on top of them (bottom=units sold).
fig, ax = plt.subplots(figsize=(10, 6))
ax.bar(data['Product'], data['Units Sold'], label='Units Sold')
ax.bar(
    data['Product'],
    data['Total Sales'],
    bottom=data['Units Sold'],
    label='Total Sales',
    alpha=0.7,
)
ax.set_title('Comparison of Units Sold and Total Sales per Product')
ax.set_xlabel('Product')
ax.set_ylabel('Units and Total Sales')
ax.legend()
plt.show()


In [34]:
import pandas as pd

# Load the dataset from the CSV file
data = pd.read_csv('sales_data.csv')

# Horizontal rule printed between report sections; defined once so every
# section uses the same line.
SEPARATOR = "--------------------------------------------------------------------------------------------"

# Throughout this cell, multi-line objects (DataFrames / Series) are printed
# with sep="\n". Embedding "\n" in the label and relying on print's default
# " " separator would prepend a space to the object's first line and shift
# it out of line with the rows below it.

print(SEPARATOR)

# Total sales per product: unit price times units sold
data['Total Sales'] = data['Price'] * data['Units Sold']
print("Total sales for each product:", data[['Product', 'Total Sales']], sep="\n")

print(SEPARATOR)

# Mean of the 'Price' column
average_price = data['Price'].mean()
print("Average price of products:", average_price)

print(SEPARATOR)

# Largest and smallest per-product total sales
max_sales = data['Total Sales'].max()
min_sales = data['Total Sales'].min()
print("Maximum sales amount:", max_sales)
print("Minimum sales amount:", min_sales)

print(SEPARATOR)

# Total revenue: sum of the 'Total Sales' column
total_revenue = data['Total Sales'].sum()
print("Total revenue from all products:", total_revenue)

print(SEPARATOR)

# Total sales summed within each category
sales_per_category = data.groupby('Category')['Total Sales'].sum()
print("Total sales per category:", sales_per_category, sep="\n")

print(SEPARATOR)

# Mean of the 'Profit Margin' column within each category
average_profit_margin_per_category = data.groupby('Category')['Profit Margin'].mean()
print("Average profit margin per category:", average_profit_margin_per_category, sep="\n")

print(SEPARATOR)

# Units sold summed within each category
units_sold_per_category = data.groupby('Category')['Units Sold'].sum()
print("Total units sold per category:", units_sold_per_category, sep="\n")

print(SEPARATOR)

# Best-selling product: the row whose 'Units Sold' value is the maximum
# (idxmax returns the index label of that row, .loc fetches the row)
best_selling_product = data.loc[data['Units Sold'].idxmax()]
print("Best selling product details:", best_selling_product, sep="\n")


--------------------------------------------------------------------------------------------
Total sales for each product:
      Product  Total Sales
0  Product A          300
1  Product B         1200
2  Product C         1350
3  Product D         1000
--------------------------------------------------------------------------------------------
Average price of products: 35.0
--------------------------------------------------------------------------------------------
Maximum sales amount: 1350
Minimum sales amount: 300
--------------------------------------------------------------------------------------------
Total revenue from all products: 3850
--------------------------------------------------------------------------------------------
Total sales per category:
 Category
Clothing       1200
Electronics    1650
Home Goods     1000
Name: Total Sales, dtype: int64
--------------------------------------------------------------------------------------------
Average profit margin per cate