In [None]:
#Libraries
import pandas as pd
from sklearn.preprocessing import StandardScaler
import matplotlib.pyplot as plt

In [None]:
# Data collection: read the survey responses from the Excel export.
survey_path = "dataset/AI On-Campus Research Survey (Responses).xlsx"
dataset = pd.read_excel(survey_path, engine="openpyxl")

In [None]:
# Remove the 'Timestamp' column, which this analysis does not need.
# errors="ignore" keeps the cell safe to re-run: because `dataset` is rebound
# here, a second execution would otherwise raise KeyError (the column is
# already gone). Note this also means a missing column is skipped silently.
dataset = dataset.drop(columns=["Timestamp"], errors="ignore")

In [None]:
# Swap the full survey question texts for short column identifiers.
# Keys must match the spreadsheet headers exactly; headers that are not
# present are left unchanged by rename().
short_names = {
    'On a scale from 1 to 5, how would you rate your knowledge and understanding of Artificial Intelligence (AI)?': 'Knowledge_AI',
    'On a scale from 1 to 5, how often do you use Artificial Intelligence (AI) for personal use?': 'Personal_use_AI',
    'On a scale from 1 to 5, how often do you use Artificial Intelligence (AI) for school-related tasks?': 'School_use_AI',
    'On a scale from 1 to 5, how interested are you in pursuing a career in Artificial Intelligence?': 'Interest_AI_Career',
}
dataset.rename(columns=short_names, inplace=True)

In [None]:
# Preview the first five rows of the dataset.
dataset.head(n=5)

In [None]:
# Data types: print the frame summary (columns, non-null counts and dtypes).
dataset.info()

In [None]:
# Count the missing values in each column.
dataset.isna().sum()

In [None]:
# Z-score outlier detection on the four rating columns.
# Selecting features for outlier detection
outlier_features = dataset[['Knowledge_AI', 'Personal_use_AI', 'School_use_AI', 'Interest_AI_Career']]

# Standardize each column (subtract its mean, divide by its standard
# deviation) so every value becomes a z-score.
scaler = StandardScaler()
standardized_features = scaler.fit_transform(outlier_features)

# The scaler output carries no row labels (a plain array by default), so rebuild
# the frame with the ORIGINAL index rather than a fresh 0..n-1 range. That way
# a flagged row can still be looked up in `dataset` even if rows were filtered
# or re-indexed before this cell.
z_scores = pd.DataFrame(
    standardized_features,
    columns=outlier_features.columns,
    index=outlier_features.index,
)

# A row is flagged when ANY of its features lies more than this many standard
# deviations from that feature's mean. Missing values compare as False and
# therefore never flag a row on their own.
Z_SCORE_THRESHOLD = 3
outliers_zscore = z_scores[(z_scores.abs() > Z_SCORE_THRESHOLD).any(axis=1)]

# Display the results (z-scores of the flagged rows; empty if none exceed the threshold)
print("Z-Score Outliers:")
print(outliers_zscore)

In [None]:
# Visualization of the numerical survey columns: one histogram per question,
# arranged in a 2x2 grid.

# Numerical columns
numerical_columns = ['Knowledge_AI', 'Personal_use_AI', 'School_use_AI', 'Interest_AI_Career']

# The survey questions are asked on an integer 1-5 scale, so use exactly one
# bin per rating, centred on the integer (edges 0.5, 1.5, ..., 5.5). Thirty
# automatic bins would leave most bins empty and draw thin bars that do not
# line up with the rating values.
# NOTE(review): assumes every response lies within 1-5; values outside that
# range would fall outside the bins and not be drawn - confirm against the data.
SCALE_MIN, SCALE_MAX = 1, 5
rating_bin_edges = [rating - 0.5 for rating in range(SCALE_MIN, SCALE_MAX + 2)]

fig, axes = plt.subplots(2, 2, figsize=(12, 8))

for ax, column in zip(axes.flat, numerical_columns):
    # Missing answers carry no rating, so leave them out of the counts.
    ax.hist(dataset[column].dropna(), bins=rating_bin_edges, color='skyblue', edgecolor='black')
    ax.set_xticks(range(SCALE_MIN, SCALE_MAX + 1))
    ax.set_title(f'Histogram of {column}')
    ax.set_xlabel(column)
    ax.set_ylabel('Frequency')

fig.tight_layout()
plt.show()