In [8]:
import os
import pandas as pd

def time_features(dataset_path, set_number=1):
    """
    Compute time features for every regular, non-hidden file in `dataset_path`.

    Entries are visited in sorted file-name order so that the returned list
    has the same order on every run and on every platform (`os.listdir`
    itself makes no ordering guarantee).

    Parameters
    ----------
    dataset_path : str
        Directory whose files are read as tab-separated, header-less tables.
    set_number : int, default 1
        Passed through unchanged to `compute_time_features`.

    Returns
    -------
    list
        One item per successfully processed file, each being whatever
        `compute_time_features` returned for that file. Files that fail are
        reported on stdout and skipped, so the list may be shorter than the
        number of files (and is empty for an empty directory).

    Raises
    ------
    OSError
        Propagated from `os.listdir` when `dataset_path` cannot be listed
        (e.g. it does not exist); only per-file errors are caught below.
    """
    all_features = []

    # Sort the listing: os.listdir returns names in arbitrary order, which
    # would make the row order of the result depend on the filesystem.
    for file_name in sorted(os.listdir(dataset_path)):
        # Skip hidden entries (names starting with a dot).
        if file_name.startswith("."):
            continue

        full_path = os.path.join(dataset_path, file_name)

        # Skip sub-directories (e.g. .ipynb_checkpoints is covered twice:
        # it is both hidden and a directory).
        if os.path.isdir(full_path):
            continue

        # (Optional) Check file extension if needed
        # if not file_name.endswith(".csv"):
        #     continue

        try:
            df = pd.read_csv(full_path, sep='\t', header=None)
            # Exactly four columns are expected; any other column count makes
            # this assignment raise a length-mismatch ValueError, which the
            # handler below reports before moving on to the next file.
            df.columns = ["Bearing 1", "Bearing 2", "Bearing 3", "Bearing 4"]

            features = compute_time_features(df, set_number)
            all_features.append(features)

        except Exception as e:
            # Deliberately best-effort: one bad file must not abort the whole
            # run. Note this also catches failures raised inside
            # compute_time_features, not only read/parse errors.
            print(f"Error reading {full_path}: {e}")
            continue

    # Callers can turn this into a table with pd.DataFrame(all_features).
    return all_features


def compute_time_features(df, set_number):
    """
    Placeholder feature extractor for a single recording.

    Reads the "Bearing 1" column of `df`, takes its mean, and returns it
    together with `set_number` as a dict with the keys "mean_b1" and "set"
    (in that order).
    """
    # Stand-in computation; real feature calculations would go here.
    bearing_one_mean = df["Bearing 1"].mean()

    summary = {}
    summary["mean_b1"] = bearing_one_mean
    summary["set"] = set_number
    return summary


# Locations of the three datasets, relative to the notebook's working directory.
dataset_path_1st, dataset_path_2nd, dataset_path_3rd = (
    "./1st_test/1st_test",
    "./2nd_test/2nd_test",
    "./3rd_test/4th_test/txt",
)

# Run the extraction per dataset. The first set is left disabled, as before.
#set1_features = time_features(dataset_path_1st, set_number=1)
# Kept as two separate statements so set2_features stays bound even if the
# third-set call raises.
set2_features = time_features(dataset_path=dataset_path_2nd, set_number=2)
set3_features = time_features(dataset_path=dataset_path_3rd, set_number=3)

In [10]:
import pandas as pd

# Tabulate the per-file feature records of set 2 (one row per record) ...
set2_df = pd.DataFrame(data=set2_features)
# ... and persist them as CSV without writing the row index.
set2_df.to_csv(path_or_buf="set2_timefeatures.csv", index=False)