In [1]:
from analysis_functions import do_rep_list, do_preprocessing, data_preparer, saver, opener

In [2]:
def make_X_y(path_import, path_export, posfix):
    """
    Function to load data from the 'path_import' folder,
    prepare it for learning and save it in the 'path_export' folder
    with 'postfix' in the end of the names.

    Parameters
    ----------

    path_import : str
        Path to the folder with the data.
    path_export : str
        Path to the folder where the data will be saved.
    posfix : str
        Postfix for the data names.
    """
    files = do_rep_list(path_import)
    print(f'Count of files: {len(files)}')
    arrays = do_preprocessing(files, path_import)
    (
        X_stress_components_new,
        X_strain_components_new,
        y_stress_components_new,
        y_strain_components_new,
    ) = data_preparer(files, arrays)
    print(f"Arrays shapes: {X_stress_components_new.shape}, " \
    f"{X_strain_components_new.shape}, " \
    f"{y_stress_components_new.shape}, " \
    f"{y_strain_components_new.shape}")
    saver(X_stress_components_new, f'X_stress_components_{posfix}', path_import=path_export)
    saver(X_strain_components_new, f'X_strain_components_{posfix}', path_import=path_export)
    saver(y_stress_components_new, f'y_stress_components_{posfix}', path_import=path_export)
    saver(y_strain_components_new, f'y_strain_components_{posfix}', path_import=path_export)
    

In [3]:
make_X_y("aisi_files", "resourses", "aisi")

Count of files: 50
..................................................
Arrays shapes: (3, 50, 5), (3, 50, 5), (3, 50, 20), (3, 50, 20)
saved in resourses/X_stress_components_aisi.pkl
saved in resourses/X_strain_components_aisi.pkl
saved in resourses/y_stress_components_aisi.pkl
saved in resourses/y_strain_components_aisi.pkl


In [3]:
def make_X_y_from_list(path_import_list, path_export, postfix):
    files_list = []
    arrays_list = []
    for path_import in path_import_list:
        print(f"Processing {path_import}")
        files = do_rep_list(path_import)
        files_list += files
        print(f"Count of files: {len(files)}")
        arrays = do_preprocessing(files, path_import)
        arrays_list += arrays

    (
        X_stress_components_new,
        X_strain_components_new,
        y_stress_components_new,
        y_strain_components_new,
    ) = data_preparer(files_list, arrays_list)
    print(
        f"Arrays shapes: {X_stress_components_new.shape}, "
        f"{X_strain_components_new.shape}, "
        f"{y_stress_components_new.shape}, "
        f"{y_strain_components_new.shape}"
    )

    saver(
        X_stress_components_new,
        f"X_stress_components_{postfix}",
        path_import=path_export,
    )
    saver(
        X_strain_components_new,
        f"X_strain_components_{postfix}",
        path_import=path_export,
    )
    saver(
        y_stress_components_new,
        f"y_stress_components_{postfix}",
        path_import=path_export,
    )
    saver(
        y_strain_components_new,
        f"y_strain_components_{postfix}",
        path_import=path_export,
    )

In [4]:
from pathlib import Path
from os import listdir
from os.path import abspath, dirname, join

In [5]:
make_X_y_from_list(
    path_import_list=[
        Path("new_components_reports") / d for d in listdir("new_components_reports")
    ],
    path_export="new_components_resources",
    postfix="new_components",
)

Processing new_components_reports/Vel_40
Count of files: 524
............................................................................................................................................................................................................................................................................................................................................................................................................................................................................................................................................
Processing new_components_reports/Vel_5
Count of files: 97
.................................................................................................
Processing new_components_reports/Vel_10
Count of files: 406
....................................................................................................................................................................................................

In [6]:
y_stress_components_new_components = opener(
    "y_stress_components_new_components", "new_components_resources"
)

y_stress_components_new_components.shape

new_components_resources/y_stress_components_new_components.pkl


(3, 1597, 20)

In [7]:
X_stress_components_new_components = opener(
    "X_stress_components_new_components", "new_components_resources"
)

X_stress_components_new_components.shape

new_components_resources/X_stress_components_new_components.pkl


(3, 1597, 5)

In [8]:
from analysis_functions import split_transform_one_comp_cv


cur_X_test, cur_y_test, val_list_X, val_list_y, train_list_X, train_list_y = (
    split_transform_one_comp_cv(
        X_stress_components_new_components[1],
        y_stress_components_new_components[1],
        n_splits=1,
    )
)

val_list_X

[array([[ 0.025     ,  0.1       ,  4.        ,  0.05      , 20.        ,
          0.        ],
        [ 0.025     ,  0.1       ,  4.        ,  0.05      , 20.        ,
          0.05263158],
        [ 0.025     ,  0.1       ,  4.        ,  0.05      , 20.        ,
          0.10526316],
        ...,
        [ 0.05      ,  0.3       , 20.        ,  0.025     , 20.        ,
          0.89473684],
        [ 0.05      ,  0.3       , 20.        ,  0.025     , 20.        ,
          0.94736842],
        [ 0.05      ,  0.3       , 20.        ,  0.025     , 20.        ,
          1.        ]])]

In [None]:
make_X_y_from_list(
    path_import_list=[
        Path("Data_set_J-C_full") / r for r in listdir(Path("Data_set_J-C_full"))
    ],
    path_export="resources_J-C_full",
    postfix="J-C_full",
)

Processing Data_set_J-C_full/Vel_40
Count of files: 463
...............................................................................................................................................................................................................................................................................................................................................................................................................................................................................
Processing Data_set_J-C_full/Vel_20
Count of files: 423
.......................................................................................................................................................................................................................................................................................................................................................................................................................................


In [5]:
opener("y_stress_components_J-C_full", "resources_J-C_full").shape


resources_J-C_full/y_stress_components_J-C_full.pkl


(3, 886, 20)

In [6]:
opener("X_stress_components_J-C_full", "resources_J-C_full").shape


resources_J-C_full/X_stress_components_J-C_full.pkl


(3, 886, 5)