# NumPy Data Analyzer

This notebook shows how to use the classes and helper functions of the NumPy Data Analyzer project to load, clean, analyze, visualize, and model data.

In [1]:
import pandas as pd
import numpy as np
from src.data_processor import DataProcessor
from src.visualizer import DataVisualizer
from src.models import StatisticalModel
from src.utils import calculate_mean, calculate_median, calculate_std_dev

# Pipeline for this cell: load the sample CSV, clean it, then analyze it.
# Every stage is bound to its own name so later cells can refer to it.
sample_csv_path = 'data/sample_data.csv'
data_processor = DataProcessor()

# Stage 1: raw load.
data = data_processor.load_data(sample_csv_path)

# Stage 2: cleaning produces a separate object; `data` is left bound to the raw load.
cleaned_data = data_processor.clean_data(data)

# Stage 3: analysis of the cleaned data, shown as plain text.
analysis_results = data_processor.analyze_data(cleaned_data)
print(analysis_results)


In [2]:
# Draw three views of the cleaned data with a single visualizer instance.
data_visualizer = DataVisualizer()

# Columns fed to the plots; edit these to match the columns in your data set.
histogram_column = 'column_name'
scatter_x_column, scatter_y_column = 'column_x', 'column_y'

# 1) Histogram of one column.
data_visualizer.plot_histogram(cleaned_data, histogram_column)

# 2) Scatter plot of one column against another.
data_visualizer.plot_scatter(cleaned_data, scatter_x_column, scatter_y_column)

# 3) Correlation matrix for the cleaned data.
data_visualizer.show_correlation_matrix(cleaned_data)


In [3]:
# Fit a statistical model on the cleaned data.
model = StatisticalModel()
model.fit_model(cleaned_data)

# `new_data` is not assigned by any earlier cell, so on a fresh kernel
# (Restart & Run All) the predict call below used to fail with NameError.
# Bind it here so the cell is self-contained. The cleaned data is reused only
# as a stand-in so the example runs end to end.
# NOTE(review): replace with genuinely unseen observations in whatever format
# StatisticalModel.predict expects — confirm against src.models.
new_data = cleaned_data

# Make predictions for the data selected above.
predictions = model.predict(new_data)
print(predictions)


In [4]:
# Summary statistics for a single column of the cleaned data.
# The column is selected once and handed to each helper in turn.
selected_column = cleaned_data['column_name']

mean_value = calculate_mean(selected_column)
median_value = calculate_median(selected_column)
std_dev_value = calculate_std_dev(selected_column)

# Report all three figures on one line.
summary_line = f'Mean: {mean_value}, Median: {median_value}, Std Dev: {std_dev_value}'
print(summary_line)