# About the notebook
This notebook averages the extracted features for each patient. Three samples (fields) were acquired per patient, so each patient's three rows are collapsed into a single row of mean feature values.

# 01 - Loading dependencies
Before running any code, the libraries this notebook depends on must be imported. `pandas` is used to read the Excel table of extracted features, average it per patient, and write the result back to Excel; `pathlib.Path` is used to build the name of the output file. The same cell also defines the helper function that performs the averaging.

In [5]:
import pandas as pd
from pathlib import Path

def convert_file_of_features_to_file_of_features_average(
    file_path, *, id_length: int = 9, samples_per_patient: int = 3
) -> None:
    """Average the numeric features of each patient and save them to Excel.

    The workbook at ``file_path`` must contain a ``file_id`` column. The first
    ``id_length`` characters of ``file_id`` identify the patient, and every
    numeric column is averaged over the rows sharing that prefix. The result
    is written next to the input file as ``<stem>_averaged_data<suffix>``,
    with the patient prefix stored in an ``ID`` column, and the output path
    is printed.

    Args:
        file_path: Location (``str`` or ``Path``) of the Excel file to read.
        id_length: Number of leading ``file_id`` characters that form the
            patient identifier.
        samples_per_patient: Number of rows every patient must have.

    Raises:
        ValueError: If a row has no usable ``file_id``, or if any patient
            does not have exactly ``samples_per_patient`` rows.
    """
    file_path = Path(file_path)
    data = pd.read_excel(file_path)

    # Patient identifier = leading characters of the per-sample file ID.
    data['shortID'] = data['file_id'].str[:id_length]

    # A missing/non-text file_id yields a NaN shortID. value_counts() and
    # groupby() both ignore NaN keys, so such rows would slip past the count
    # check below; reject them explicitly instead.
    if data['shortID'].isna().any():
        raise ValueError("Every row must have a text 'file_id' value")

    # Every patient must contribute the expected number of samples; report
    # the offenders so the input file can be fixed without guesswork.
    counts = data['shortID'].value_counts()
    offending = counts[counts != samples_per_patient]
    if not offending.empty:
        details = ', '.join(f'{pid} ({n})' for pid, n in offending.items())
        raise ValueError(
            f'Exactly {samples_per_patient} fields per patient are required; '
            f'offending IDs (field count): {details}'
        )

    # Only numeric columns can be averaged ('file_id'/'shortID' are text).
    numeric_columns = data.select_dtypes(include='number').columns

    # sort=False keeps patients in order of first appearance in the input.
    averaged_data = (
        data.groupby('shortID', sort=False)[numeric_columns]
        .mean()
        .reset_index()
        .rename(columns={'shortID': 'ID'})
    )

    # Same folder and extension as the input, with a suffixed stem.
    output_file_name = file_path.with_stem(file_path.stem + '_averaged_data')
    averaged_data.to_excel(output_file_name, index=False)

    print(f'The file has been saved as {output_file_name}')


In [13]:
# Machine-specific absolute path to the Excel workbook of extracted features
# (raw string so the Windows backslashes are not treated as escapes).
# Edit this to point at your own copy of the data.
file_path = r"C:\Users\paulh\OneDrive\Documentos\PAPER\Journal\2024_Psoriasis\analysis_dataset\Tratamiento\Claudina_4\group_1.xlsx"
# Average the features per patient; the result is written next to the input
# file with "_averaged_data" appended to its stem, and the path is printed.
convert_file_of_features_to_file_of_features_average(file_path)

The file has been saved as C:\Users\paulh\OneDrive\Documentos\PAPER\Journal\2024_Psoriasis\analysis_dataset\Tratamiento\Claudina_4\group_1_averaged_data.xlsx
