In [6]:
import pandas as pd
from scipy.stats import shapiro

# Read the CSV into a DataFrame. The first row supplies the column names
# (header=0) and the first column becomes the row index (index_col=0), so
# neither is treated as a data value. The 'Th' column is then removed before
# any analysis.
# NOTE(review): the reason for excluding 'Th' is not recorded here — confirm.
data = pd.read_csv("dataset.csv", index_col=0, header=0).drop(columns=['Th'])

In [7]:
# Shapiro-Wilk normality test, run independently on every column of `data`.
# Missing values are dropped per column before testing. A small p-value is
# evidence against the null hypothesis that the column is normally distributed.
# Both numbers are printed with three decimals, so "p=0.000" means the p-value
# rounded to zero (p < 0.0005), not that it is exactly zero.
report_line = 'Column {}: Statistics={:.3f}, p={:.3f}'
for column_name in data.columns:
    observed = data[column_name].dropna()
    w_statistic, p_value = shapiro(observed)
    print(report_line.format(column_name, w_statistic, p_value))

Column areia: Statistics=0.921, p=0.000
Column silte: Statistics=0.897, p=0.000
Column argila: Statistics=0.883, p=0.000
Column pH: Statistics=0.985, p=0.015
Column CTC: Statistics=0.668, p=0.000
Column COT: Statistics=0.799, p=0.000
Column Ba: Statistics=0.748, p=0.000
Column Cd: Statistics=0.487, p=0.000
Column Co: Statistics=0.830, p=0.000
Column Cr: Statistics=0.661, p=0.000
Column Cu: Statistics=0.788, p=0.000
Column Fe: Statistics=0.626, p=0.000
Column Mn: Statistics=0.765, p=0.000
Column Ni: Statistics=0.644, p=0.000
Column Pb: Statistics=0.847, p=0.000
Column Se: Statistics=0.791, p=0.000
Column Sb: Statistics=0.541, p=0.000
Column V: Statistics=0.711, p=0.000
Column Zn: Statistics=0.809, p=0.000
Column Sc: Statistics=0.787, p=0.000
Column La: Statistics=0.666, p=0.000
Column Ce: Statistics=0.709, p=0.000
Column Pr: Statistics=0.743, p=0.000
Column Nd: Statistics=0.705, p=0.000
Column Sm: Statistics=0.705, p=0.000
Column Eu: Statistics=0.652, p=0.000
Column LREE: Statistics=0.7

In [9]:
# Pairwise rank-based (Spearman) correlation between the columns of `data`.
correlation_method = "spearman"
spearman_corr_matrix = data.corr(method=correlation_method)

# Leave the matrix as the cell's final expression so the notebook renders it.
spearman_corr_matrix

Unnamed: 0,areia,silte,argila,pH,CTC,COT,Ba,Cd,Co,Cr,...,Gd,Tb,Dy,Er,Ho,Yb,Lu,HREE,LREE/HREE,REE
areia,1.0,-0.824568,-0.874957,-0.281815,-0.743712,-0.514033,-0.700593,-0.511723,-0.478724,-0.632388,...,-0.708838,-0.715288,-0.597524,-0.720807,-0.690002,-0.769846,-0.645259,-0.717982,0.164965,-0.707986
silte,-0.824568,1.0,0.495841,0.346087,0.636606,0.348263,0.759904,0.476805,0.5195,0.437928,...,0.655549,0.625133,0.519188,0.617055,0.482912,0.624798,0.523758,0.642566,-0.172585,0.636153
argila,-0.874957,0.495841,1.0,0.202883,0.679696,0.521426,0.529898,0.415194,0.337983,0.623249,...,0.610473,0.654187,0.550468,0.670259,0.702015,0.739699,0.61332,0.641865,-0.141218,0.632385
pH,-0.281815,0.346087,0.202883,1.0,0.432198,-0.087005,0.442137,0.167746,0.507428,0.343561,...,0.518645,0.493778,0.43629,0.510861,0.43801,0.437407,0.504827,0.516488,-0.321427,0.436054
CTC,-0.743712,0.636606,0.679696,0.432198,1.0,0.650283,0.651417,0.445437,0.648794,0.578505,...,0.817249,0.80537,0.675931,0.80432,0.680991,0.796264,0.797228,0.801898,-0.415805,0.729326
COT,-0.514033,0.348263,0.521426,-0.087005,0.650283,1.0,0.243907,0.353592,0.077688,0.233248,...,0.280816,0.309843,0.230304,0.272111,0.283002,0.380017,0.253463,0.26697,0.050291,0.335318
Ba,-0.700593,0.759904,0.529898,0.442137,0.651417,0.243907,1.0,0.425713,0.582233,0.539258,...,0.776733,0.73566,0.626822,0.699361,0.537203,0.701636,0.541991,0.755268,-0.214591,0.737434
Cd,-0.511723,0.476805,0.415194,0.167746,0.445437,0.353592,0.425713,1.0,0.168229,0.416772,...,0.37586,0.428515,0.374374,0.397545,0.404024,0.48131,0.342775,0.412508,-0.027304,0.416466
Co,-0.478724,0.5195,0.337983,0.507428,0.648794,0.077688,0.582233,0.168229,1.0,0.625138,...,0.711698,0.695924,0.649786,0.731305,0.710692,0.638059,0.801086,0.709396,-0.534536,0.596279
Cr,-0.632388,0.437928,0.623249,0.343561,0.578505,0.233248,0.539258,0.416772,0.625138,1.0,...,0.567828,0.568756,0.446644,0.597293,0.59423,0.626219,0.533713,0.579089,-0.439705,0.46895


In [10]:
# Write the correlation matrix to a CSV file in the current working directory.
# Row and column labels are written as well (to_csv defaults), so the file can
# be read back with index_col=0.
spearman_corr_matrix.to_csv(path_or_buf="spearman_corr_matrix.csv")