In [None]:
import os
import sys

def change_working_directory(new_dir):
    """
    Change the current working directory, reporting failures instead of raising.

    Any exception raised while switching directories is caught and reported
    with ``print``; nothing propagates to the caller. The return value lets
    the caller detect a failure that would otherwise only be visible in the
    printed output.

    Args:
        new_dir (str): Path of the directory to switch to.

    Returns:
        bool: True if the directory was changed and reported successfully,
        False if an exception was caught (its message has already been
        printed).
    """
    try:
        os.chdir(new_dir)
        # Echo the location reported by the OS so the output shows where we ended up.
        print(f"Current working directory changed to: {os.getcwd()}")
    except FileNotFoundError:
        print(f"Error: Directory '{new_dir}' not found.")
        return False
    except PermissionError:
        print(f"Error: Insufficient permissions to access '{new_dir}'.")
        return False
    except Exception as e:
        # Deliberate best-effort: report anything else (e.g. a path that is
        # not a directory, or a bad argument type) rather than crash.
        print(f"An error occurred: {e}")
        return False
    return True

# Absolute location of the project checkout, kept in one place so the import
# paths and the working directory cannot drift apart.
PROJECT_ROOT = "Q:/SANDBOX/PredictEstateShowcase_dev/"

# Make the `src` directory and the project root importable. The membership
# check keeps sys.path from accumulating duplicates when this cell is re-run.
for import_path in (PROJECT_ROOT + "src", PROJECT_ROOT):
    if import_path not in sys.path:
        sys.path.append(import_path)

# Run the rest of the notebook from the project root.
change_working_directory(PROJECT_ROOT)


In [None]:
# Import libraries
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt

# Path to the file.
# NOTE(review): this is resolved relative to the current working directory at
# the time the cell runs -- confirm that "../data" is the intended location.
file_path = "../data/sample_data.csv"

# Load the data
df = pd.read_csv(file_path)

# Initial analysis: size, per-column dtypes, and per-column missing-value counts
print(f"Data dimensions (rows, columns): {df.shape}")
print("Data types for each column:")
print(df.dtypes)
print("\nMissing values in each column:")
print(df.isnull().sum())

# Column whose distribution is plotted. "column_name" is a placeholder and
# must be replaced with a column that exists in the CSV, otherwise the lookup
# below raises KeyError.
column = "column_name"

# Visualization of the distribution of a specific column (histogram + KDE curve)
sns.histplot(df[column], kde=True)
plt.title(f"Distribution of values in '{column}'")
plt.xlabel("Values")
plt.ylabel("Frequency")
plt.show()

# Correlation matrix to understand relationships between numeric features.
# Restrict to numeric/bool columns first: on recent pandas, calling corr() on
# a frame that still contains string/object columns raises instead of
# silently dropping them.
numeric_df = df.select_dtypes(include=["number", "bool"])
correlation_matrix = numeric_df.corr()
sns.heatmap(correlation_matrix, annot=True, cmap="coolwarm")
plt.title("Correlation Matrix")
plt.show()
