In [3]:
import pandas as pd
import numpy as np

In [4]:
# Use this loader when the notebook is run from the same folder that holds the data files
def read_data(survey_section, discipline, dataset):
    ''' Reads one UCUES CSV file from the current working directory and returns it as a pandas dataframe

    The file name is assembled as <survey_section>_data_<discipline>_<dataset>.csv and is resolved
    relative to the working directory. The file is parsed as tab-separated text encoded as
    UTF-16 little-endian.

    Params:
        survey_section  str, shortened section name, ex: Satis
        discipline      str, shortened discipline name, ex: Hum
        dataset         int, the sub-dataset from the specified survey section

    Returns:
        pandas dataframe holding the parsed contents of the file
    '''
    # Only the bare file name is built, so the lookup happens next to the notebook
    csv_name = f"{survey_section}_data_{discipline}_{dataset}.csv"
    return pd.read_csv(csv_name, sep="\t", encoding="utf-16le")

In [5]:
def read_data_from_file_path(file_path, UCUES_dataset, survey_section, discipline, dataset):
    ''' Reads one UCUES CSV file stored under a project folder and returns it as a pandas dataframe

    The file is looked up at
        <file_path>/Data/UCUES-<UCUES_dataset>/<survey_section>_data_<discipline>_<dataset>.csv
    and parsed as tab-separated text encoded as UTF-16 little-endian.

    Params:
        file_path       str, folder that CONTAINS the Data folder; "/Data" is appended by this
                        function, so leave it out, ex: /Users/omarramos/Documents/Data_Mural_Project
        UCUES_dataset   str, name of the UCUES survey section and sub-dataset number, ex: Satisfaction-1
        survey_section  str, shortened section name, ex: Satis
        discipline      str, shortened discipline name, ex: Hum
        dataset         int, the sub-dataset from the specified survey section

    Returns:
        pandas dataframe holding the parsed contents of the file
    '''
    # Build the file name first, then place it inside the per-dataset folder
    csv_name = f"{survey_section}_data_{discipline}_{dataset}.csv"
    csv_location = f"{file_path}/Data/UCUES-{UCUES_dataset}/{csv_name}"
    return pd.read_csv(csv_location, sep="\t", encoding="utf-16le")

In [6]:
# Same-folder alternative, kept disabled: read_data("Satis", "Arts", 1)
# Preview the first rows of the Arts file from the Satisfaction-1 dataset.
read_data_from_file_path(
    "/Users/emilylopez/Desktop/data_mural/data_mural_proj",
    "Satisfaction-1",
    "Satis",
    "Arts",
    1,
).head()

Unnamed: 0,Label1,Pivot Field Values,Calculation1,Total
0,Top campus administrators are genuinely commit...,6,17%,27
1,"Knowing what I know now, I would still choose ...",6,31%,50
2,I feel valued as an individual at this institu...,6,14%,22
3,I feel that I belong at this university,6,19%,31
4,Faculty are genuinely committed to promoting r...,6,27%,42


In [7]:
# Example: load the same survey section for every discipline, one dataframe per discipline.
file_path = "/Users/emilylopez/Desktop/data_mural/data_mural_proj"
UCUES_dataset = "Satisfaction-1"
survey_section = "Satis"
dataset = 1
disciplines = ["Arts", "Hum", "Life", "Eng", "Health", "Phys", "Prof", "Social", "Undec"]

# One dataframe per discipline, in the same order as `disciplines`
array_dfs = []
for discipline in disciplines:
    df = read_data_from_file_path(file_path, UCUES_dataset, survey_section, discipline, dataset)
    # Adds a column NAMED after the discipline (e.g. "Arts") that repeats that name on every row.
    # NOTE(review): a single shared "discipline" column may have been intended - confirm before
    # concatenating these frames, since each one currently gets a differently named column.
    df[discipline] = [discipline] * len(df)
    array_dfs.append(df)

## Importing datasets that use a different file-naming convention

**E.g. Camp_Cli_data_Arts 2.csv**

***Data/UCUES-Camp-Cli-1/Camp_Cli_data_Arts 2.csv***

***UPDATE:*** I don't think we need this function anymore, since the datasets were renamed.

In [8]:
def read_data_from_file_path(file_path, UCUES_dataset, survey_section, discipline_dataset, dataset=None):
    ''' Loads a UCUES dataset from the Data Mural Project Data folder and returns it as a pandas dataframe

    Running this cell rebinds the name of the earlier five-argument function defined higher up in
    this notebook. To keep the earlier cells working when they are re-run, both calling
    conventions are accepted:

        * four arguments  -> <survey_section>_data_<discipline_dataset>.csv
                             (discipline and sub-dataset already joined, ex: "Arts 2")
        * five arguments  -> <survey_section>_data_<discipline_dataset>_<dataset>.csv
                             (discipline and sub-dataset passed separately, ex: "Arts", 1)

    In both cases the file is looked up inside <file_path>/Data/UCUES-<UCUES_dataset>/ and parsed
    as tab-separated text encoded as UTF-16 little-endian.

    Params:
        file_path           str, folder that CONTAINS the Data folder; "/Data" is appended by this
                            function, so leave it out, ex: /Users/omarramos/Documents/Data_Mural_Project
        UCUES_dataset       str, name of the UCUES survey section and sub-dataset number, ex: Camp-Cli-1
        survey_section      str, shortened section name, ex: Camp_Cli
        discipline_dataset  str, shortened discipline name; when `dataset` is omitted it must also
                            carry the sub-dataset exactly as it appears in the file name, ex: Arts 2
        dataset             int, optional, the sub-dataset from the specified survey section; when
                            given it is appended to the file name after an underscore

    Returns:
        pandas dataframe holding the parsed contents of the file
    '''
    # Pick the file-name pattern that matches the calling convention
    if dataset is None:
        csv_name = "{}_data_{}.csv".format(survey_section, discipline_dataset)
    else:
        csv_name = "{}_data_{}_{}.csv".format(survey_section, discipline_dataset, dataset)

    # A separate local name avoids rebinding the `file_path` parameter
    csv_location = "{}/Data/UCUES-{}/{}".format(file_path, UCUES_dataset, csv_name)
    return pd.read_csv(csv_location, encoding='utf-16le', sep='\t')

#### Testing with Data/UCUES-Camp-Cli-1/Camp_Cli_data_Health_Clinical 2.csv

In [10]:
# Arguments for the space-separated naming scheme: discipline and sub-dataset travel as ONE string.
survey_section = "Camp_Cli"
UCUES_dataset = "Camp-Cli-1"
discipline_dataset = "Health_Clinical 2"
file_path = "/Users/emilylopez/Desktop/data_mural/data_mural_proj"

# The call is the last expression of the cell, so the returned dataframe is displayed.
read_data_from_file_path(
    file_path,
    UCUES_dataset,
    survey_section,
    discipline_dataset,
)

Unnamed: 0,Label1,Pivot Field Values,Calculation1,Total
0,UC [CAMPUS] is a welcoming campus,6,5%,7
1,UC [CAMPUS] is a safe and secure campus,6,2%,3
2,"Overall, I feel comfortable with the climate f...",6,9%,13
3,"Overall, I feel comfortable with the climate f...",6,13%,19
4,"Overall, I feel comfortable with the campus cl...",6,26%,37
5,UC [CAMPUS] is a welcoming campus,5,36%,51
6,UC [CAMPUS] is a safe and secure campus,5,23%,32
7,"Overall, I feel comfortable with the climate f...",5,36%,51
8,"Overall, I feel comfortable with the climate f...",5,44%,62
9,"Overall, I feel comfortable with the campus cl...",5,45%,64
