In [9]:
import os
import numpy as np

# Define the directories
dir1 = r'F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels'

# List the files in the directory
files_dir1 = ['train_seglab_0.16.npy', 'dev_seglab_0.16.npy', 'eval_seglab_0.16.npy']

# Function to load and explore numpy files
def explore_npy_files(directory, files):
    print(f"Exploring files in: {directory}\n")
    for file in files:
        file_path = os.path.join(directory, file)
        if os.path.exists(file_path):
            try:
                data = np.load(file_path, allow_pickle=True)  # Allow pickle loading
                print(f"File: {file}")
                
                # For 0-dimensional objects
                if data.shape == ():  
                    print(f"Loaded object type: {type(data)}")
                else:
                    print(f"Shape: {data.shape}")
                    print(f"Data type: {data.dtype}")
                    
                    # Print only a small portion of the data to avoid large output
                    if data.size > 0:
                        print(f"First 5 entries (if applicable): {data.flat[:5]}")
                
                print('-' * 50)
            except Exception as e:
                print(f"Could not load {file}. Error: {e}")
        else:
            print(f"File not found: {file}")
        print()

# Explore the files in the directory
explore_npy_files(dir1, files_dir1)


Exploring files in: F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels

File: train_seglab_0.16.npy
Loaded object type: <class 'numpy.ndarray'>
--------------------------------------------------

File: dev_seglab_0.16.npy
Loaded object type: <class 'numpy.ndarray'>
--------------------------------------------------

File: eval_seglab_0.16.npy
Loaded object type: <class 'numpy.ndarray'>
--------------------------------------------------



In [14]:
explore_npy_files(dir2, files_dir2)

Exploring files in: F:\Awais_data\Datasets\PartialSpoof\database_segment_labels_v1.2\database\segment_labels

File: train_seglab_0.01.npy
Shape: ()
Data type: object
Number of keys: 25380
Sample keys: ['LA_T_1000406', 'LA_T_1007571', 'LA_T_1007663', 'LA_T_1011221', 'LA_T_1013597']
Key: LA_T_1000406, Sample value: ['1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1'

In [12]:
import os
import numpy as np
from collections import defaultdict

# Define the directories
dir1 = r'F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels'

# List the files in the directory
files_dir1 = ['train_seglab_0.16.npy', 'dev_seglab_0.16.npy', 'eval_seglab_0.16.npy']

# Function to explore defaultdict objects
def explore_defaultdict_content(data):
    if isinstance(data, defaultdict):
        print(f"Number of keys: {len(data)}")
        sample_keys = list(data.keys())[:5]  # Print a sample of 5 keys
        print(f"Sample keys: {sample_keys}")
        for key in sample_keys:
            print(f"Key: {key}, Sample value: {data[key]}")
        print('-' * 50)
    else:
        print("The data is not a defaultdict.")

# Function to load and explore numpy files
def explore_npy_files(directory, files):
    print(f"Exploring files in: {directory}\n")
    for file in files:
        file_path = os.path.join(directory, file)
        if os.path.exists(file_path):
            try:
                data = np.load(file_path, allow_pickle=True)  # Allow pickle loading
                print(f"File: {file}")
                
                # Check basic properties
                print(f"Shape: {data.shape}")
                print(f"Data type: {data.dtype}")
                
                # Since the data is an object (defaultdict), explore its content
                actual_data = data.item()  # Get the actual defaultdict object from the 0-dim array
                explore_defaultdict_content(actual_data)
                
            except Exception as e:
                print(f"Could not load {file}. Error: {e}")
        else:
            print(f"File not found: {file}")
        print()

# Explore the files in the directory
explore_npy_files(dir1, files_dir1)


Exploring files in: F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels

File: train_seglab_0.16.npy
Shape: ()
Data type: object
Number of keys: 25380
Sample keys: ['LA_T_1000406', 'LA_T_1007571', 'LA_T_1007663', 'LA_T_1011221', 'LA_T_1013597']
Key: LA_T_1000406, Sample value: ['1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1']
Key: LA_T_1007571, Sample value: ['1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1']
Key: LA_T_1007663, Sample value: ['1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1']
Key: LA_T_1011221, Sample value: ['1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1']
Key: LA_T_1013597, Sample value: ['1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1' '1'
 '1' '1' '1' '1' '1']
-------------------------------

In [13]:
import os
import numpy as np
import pandas as pd
from collections import defaultdict

# Define the directories
dir1 = r'F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels'
output_dir = dir1  # Save the Excel files in the same location

# List the files in the directory
files_dir1 = ['train_seglab_0.16.npy', 'dev_seglab_0.16.npy', 'eval_seglab_0.16.npy']

# Function to convert defaultdict to a Pandas DataFrame
def defaultdict_to_dataframe(dd):
    if isinstance(dd, defaultdict):
        df = pd.DataFrame(list(dd.items()), columns=['Key', 'Value'])
        return df
    return None

# Function to load, convert, and save numpy files to Excel
def explore_and_save_to_excel(directory, files):
    print(f"Exploring files in: {directory}\n")
    for file in files:
        file_path = os.path.join(directory, file)
        if os.path.exists(file_path):
            try:
                # Load the numpy file
                data = np.load(file_path, allow_pickle=True)  # Allow pickle loading
                
                # Extract defaultdict object
                actual_data = data.item()  # Get the actual defaultdict object from the 0-dim array
                
                # Convert defaultdict to DataFrame
                df = defaultdict_to_dataframe(actual_data)
                if df is not None:
                    # Define the output file path
                    excel_file_path = os.path.join(output_dir, file.replace('.npy', '.xlsx'))
                    
                    # Save DataFrame to Excel
                    df.to_excel(excel_file_path, index=False)
                    print(f"Saved {file} to {excel_file_path}")
                else:
                    print(f"Data in {file} is not a defaultdict.")
                    
            except Exception as e:
                print(f"Could not process {file}. Error: {e}")
        else:
            print(f"File not found: {file}")
        print()

# Explore the files in the directory and save to Excel
explore_and_save_to_excel(dir1, files_dir1)


Exploring files in: F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels

Saved train_seglab_0.16.npy to F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels\train_seglab_0.16.xlsx

Saved dev_seglab_0.16.npy to F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels\dev_seglab_0.16.xlsx

Saved eval_seglab_0.16.npy to F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels\eval_seglab_0.16.xlsx



In [2]:
import os
import numpy as np
import pandas as pd
from collections import defaultdict

# Define the directories
dir1 = r'F:\Awais_data\Datasets\PartialSpoof\database_segment_labels\database\segment_labels'
dir2 = r'F:\Awais_data\Datasets\PartialSpoof\database_segment_labels_v1.2\database\segment_labels'

# List the files in both directories
# files_dir1 = ['train_seglab_0.16.npy', 'dev_seglab_0.16.npy', 'eval_seglab_0.16.npy']
# files_dir2 = [
#     'train_seglab_0.01.npy', 'train_seglab_0.02.npy', 'train_seglab_0.04.npy', 'train_seglab_0.08.npy',
#     'train_seglab_0.16.npy', 'train_seglab_0.32.npy', 'dev_seglab_0.01.npy', 'dev_seglab_0.02.npy',
#     'dev_seglab_0.04.npy', 'dev_seglab_0.08.npy', 'dev_seglab_0.16.npy', 'dev_seglab_0.32.npy',
#     'eval_seglab_0.01.npy', 'eval_seglab_0.02.npy', 'eval_seglab_0.04.npy', 'eval_seglab_0.08.npy',
#     'eval_seglab_0.16.npy', 'eval_seglab_0.32.npy'
# ]

files_dir2 = [
    'dev_seglab_0.64.npy', 'train_seglab_0.64.npy'
]
# Function to convert defaultdict to a Pandas DataFrame
def defaultdict_to_dataframe(dd):
    if isinstance(dd, defaultdict):
        df = pd.DataFrame(list(dd.items()), columns=['Key', 'Value'])
        return df
    return None

# Function to load, convert, and save numpy files to Excel
def explore_and_save_to_excel(directory, files):
    print(f"Exploring files in: {directory}\n")
    for file in files:
        file_path = os.path.join(directory, file)
        if os.path.exists(file_path):
            try:
                # Load the numpy file
                data = np.load(file_path, allow_pickle=True)  # Allow pickle loading
                
                # Extract defaultdict object
                actual_data = data.item()  # Get the actual defaultdict object from the 0-dim array
                
                # Convert defaultdict to DataFrame
                df = defaultdict_to_dataframe(actual_data)
                if df is not None:
                    # Define the output file path
                    excel_file_path = os.path.join(directory, file.replace('.npy', '.xlsx'))
                    
                    # Save DataFrame to Excel
                    df.to_excel(excel_file_path, index=False)
                    print(f"Saved {file} to {excel_file_path}")
                else:
                    print(f"Data in {file} is not a defaultdict.")
                    
            except Exception as e:
                print(f"Could not process {file}. Error: {e}")
        else:
            print(f"File not found: {file}")
        print()

# Explore and save to Excel for both directories
# explore_and_save_to_excel(dir1, files_dir1)
explore_and_save_to_excel(dir2, files_dir2)


Exploring files in: F:\Awais_data\Datasets\PartialSpoof\database_segment_labels_v1.2\database\segment_labels

Saved dev_seglab_0.64.npy to F:\Awais_data\Datasets\PartialSpoof\database_segment_labels_v1.2\database\segment_labels\dev_seglab_0.64.xlsx

Saved train_seglab_0.64.npy to F:\Awais_data\Datasets\PartialSpoof\database_segment_labels_v1.2\database\segment_labels\train_seglab_0.64.xlsx

