## What is this notebook about?

Here, we analyse the sociodemographic information of the study participants.

The numbers calculated here and in other notebooks will be stored in the file indicated by the variable `data_reports_fp` for future reference.

In [1]:
# Some imports to get things started
import sys
import os
import pandas as pd
import numpy as np
import warnings
# Suppress every warning for the rest of the session (no category filter is
# given, so this also hides deprecation and pandas warnings).
warnings.filterwarnings('ignore')

# Put the parent directory on the module search path before importing the
# helpers below. The path is resolved relative to the current working
# directory, so the notebook is expected to be run from its own folder.
# NOTE(review): presumably `utils` lives one level up -- confirm.
sys.path.insert(1, os.path.abspath('../'))
from utils import save_descriptive_stats, save_variables
from pathlib import Path

In [2]:
# Read the questionnaire answers into a DataFrame
survey_fp = Path('../data/survey.xlsx')
survey_info = pd.read_excel(survey_fp)

# File that collects the numbers produced by the analysis cells below
data_reports_fp = Path('../reports/numbers.dat')

In [3]:
# Store descriptive statistics of the participants' age under the key 'age'
age_values = survey_info['age'].values
save_descriptive_stats(data_reports_fp, 'age', age_values)

In [4]:
# Store how often each gender was indicated, one saved variable per category.
# `value_counts` skips missing answers by default, so they get no entry.
gender_counts = survey_info['gender'].value_counts()
for gender_label in gender_counts.index:
    # Saved under the key `gender_<label>`
    n_with_gender = gender_counts[gender_label]
    save_variables(data_reports_fp, f'gender_{gender_label}', n_with_gender)

In [5]:
# Store the number of participants whose education counts as higher education.
# Both the "(or comparable)" and "(or equivalent)" wordings are matched.
# NOTE(review): presumably the questionnaire used both phrasings -- confirm.
higher_education = [
    'Bachelor (or comparable)',
    'Master (or comparable)',
    'Doctoral degree',
    'Bachelor (or equivalent)',
    'Master (or equivalent)',
]
has_higher_education = survey_info['education'].isin(higher_education)
# Summing the boolean mask counts the matching rows; cast to a plain int
higher_education_count = int(has_higher_education.sum())
save_variables(data_reports_fp, 'higher_education', higher_education_count)

In [6]:
# Store how often each employment status was indicated, one saved variable
# per category. `value_counts` skips missing answers by default.
employment_counts = survey_info['employed'].value_counts()
for status_label in employment_counts.index:
    # Saved under the key `employed_<label>`
    n_with_status = employment_counts[status_label]
    save_variables(data_reports_fp, f'employed_{status_label}', n_with_status)