## Null removal

In [2]:
import os
import pandas as pd

# Define the folder paths
DATASET_FOLDER = r"D:\Desktop\SEM 7\Mini Project\Dataset"
OUTPUT_FOLDER = r"D:\Desktop\SEM 7\Mini Project\Filtered_Dataset"

# Check if the dataset folder exists
if not os.path.exists(DATASET_FOLDER):
    print(f"Folder does not exist: {DATASET_FOLDER}")
    exit()

# Create the output folder if it doesn't exist
os.makedirs(OUTPUT_FOLDER, exist_ok=True)

# Null address to remove
null_address = '0x0000000000000000000000000000000000000000'

# List all CSV files in the dataset folder
csv_files = [f for f in os.listdir(DATASET_FOLDER) if f.endswith(".csv")]

# Loop through each file in the dataset folder
for file in csv_files:
    file_path = os.path.join(DATASET_FOLDER, file)
    
    # Read the CSV file into a DataFrame
    df = pd.read_csv(file_path)
    
    # Clean the 'from' and 'to' columns to ensure consistent formatting
    df['from'] = df['from'].astype(str).str.strip().str.lower()
    df['to'] = df['to'].astype(str).str.strip().str.lower()
    
    # Filter out rows where either 'from' or 'to' is the null address
    df_filtered = df[(df['from'] != null_address) & (df['to'] != null_address)]
    
    # Generate the output file path
    output_file_path = os.path.join(OUTPUT_FOLDER, file)
    
    # Save the filtered DataFrame
    df_filtered.to_csv(output_file_path, index=False)
    
    print(f"Processed and saved: {output_file_path}")

print("\n✅ All files filtered and saved successfully.")


Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\0to999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\10000000to10999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\1000000to1999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\11000000to11999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\12000000to12999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\13000000to13249999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\13250000to13499999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\13500000to13749999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\2000000to2999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\

  df = pd.read_csv(file_path)


Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\4000000to4999999_ERC721Transaction.csv


  df = pd.read_csv(file_path)


Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\5000000to5999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\6000000to6999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\7000000to7999999_ERC721Transaction.csv


  df = pd.read_csv(file_path)


Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\8000000to8999999_ERC721Transaction.csv
Processed and saved: D:\Desktop\SEM 7\Mini Project\Filtered_Dataset\9000000to9999999_ERC721Transaction.csv

✅ All files filtered and saved successfully.
