In [1]:
import os
import pandas as pd
import matplotlib.pyplot as plt
import math
import duckdb
import numpy as np
# Render DataFrames without truncation: no cap on the number of columns shown
pd.options.display.max_columns = None

# ...and no cap on the width of an individual cell's text
pd.options.display.max_colwidth = None

# Open the on-disk DuckDB database (the file is created if it does not exist yet)
con = duckdb.connect(database='my_database.duckdb')

In [2]:
import pandas as pd
import re

# Load the whole CSV into memory as a list of raw text lines
file_path = 'wbtcweth_decoded.csv'

with open(file_path, 'r') as file:
    # Iterating a text file yields its lines, newline characters included
    lines = list(file)

# Maps each transaction type to the list of parsed rows seen for that type
transaction_dict = dict()

# Split a raw line on every comma; quoted text gets no special treatment
def parse_line(line):
    """Return the comma-separated fields of ``line`` with whitespace trimmed.

    The split is purely textual: a comma inside single quotes still starts a
    new field, so quoted values are never merged back together.
    """
    return [piece.strip() for piece in line.split(',')]

# Bucket every parsed row under its transaction type, taken from the 6th field
for line in lines:
    fields = parse_line(line.strip())
    if len(fields) <= 5:
        # Fewer than 6 fields means there is no type to group on; skip the row
        continue
    transaction_type = fields[5]
    # setdefault creates the bucket the first time a type is encountered
    transaction_dict.setdefault(transaction_type, []).append(fields)

# Build one DataFrame per transaction type, keyed by the type name
dataframes = {}
for transaction_type, data in transaction_dict.items():
    # Rows of one type may differ in length, so size the frame to the widest row
    num_columns = max(map(len, data))
    column_names = [f'Field_{position}' for position in range(1, num_columns + 1)]
    # Right-pad shorter rows with empty strings up to the common width
    padded_data = [row + [''] * (num_columns - len(row)) for row in data]
    df = pd.DataFrame(padded_data, columns=column_names)
    dataframes[transaction_type] = df

# Report which transaction types produced a DataFrame
for transaction_type in dataframes:
    print(f'Created DataFrame: {transaction_type}')

# Keep a direct handle on the fee-change events; raises KeyError if none were parsed
SwapFeePercentageChanged = dataframes['SwapFeePercentageChanged']


Created DataFrame: Transfer
Created DataFrame: SwapFeePercentageChanged
Created DataFrame: Approval


In [3]:
# Inspect the parsed fee-change rows; columns still carry the generic Field_N names
SwapFeePercentageChanged

Unnamed: 0,Field_1,Field_2,Field_3,Field_4,Field_5,Field_6,Field_7,Field_8,Field_9,Field_10,Field_11,Field_12,Field_13,Field_14,Field_15,Field_16
0,12505422,124,109,0x0e5c53950574cb933da47d5a885ae7f134849f43fa77eb818d9efd5cc65dbed0,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,4100000000000000,,,,,,,,,
1,12654826,142,187,0x7aadce84f11aa371f3ae09e56fbd46db03da1d3723d6df345fbde0f9a71548c1,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,3900000000000000,,,,,,,,,
2,12693310,154,299,0xd2bb72c0cfcea82cd4f7c3ff02fe7fe5b52bae983a71dfa0b746829d3233c0d5,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,3500000000000000,,,,,,,,,
3,12814302,3,2,0x22e8bd2d2df1bdf4ae53ce8621078b7003dc74b8254de647d1d378dffef942de,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,3300000000000000,,,,,,,,,
4,12859412,201,271,0xf4241a0d9993a2d2ef6c0ae84fd35686f1e164ce804735ec10486d568959979d,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,3000000000000000,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
925,19980897,24,182,0x36654991e5f8ba562c2fc6f8041c5f0bfcbc8378579f692d46a137b3c99ef033,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,2500000000000000,,,,,,,,,
926,19981171,18,189,0x0a06bbeb8c48bf4363ba361714f5caf366076a2273dc1b6901d12a1e4cea9f51,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,500000000000000,,,,,,,,,
927,19981171,18,195,0x0a06bbeb8c48bf4363ba361714f5caf366076a2273dc1b6901d12a1e4cea9f51,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,2500000000000000,,,,,,,,,
928,19999851,7,63,0x7f6f897ed561572c2ad056623aac9977435d9beb735d7312c36c790b3231f22f,0xA6F548DF93de924d73be7D25dC02554c6bD66dB5,SwapFeePercentageChanged,500000000000000,,,,,,,,,


In [4]:
# Positional Field_N columns to keep, mapped to their descriptive names
selected_columns = {
    'Field_1': 'block_number',
    'Field_3': 'log_index',
    'Field_4': 'transaction_hash',
    'Field_6': 'event',
    'Field_7': 'fee',
}

# Derive the trimmed frame from the untouched per-type frame in `dataframes`
# rather than from SwapFeePercentageChanged itself. Overwriting a variable with
# a function of itself made this cell fail with a KeyError on a second run,
# because the Field_N columns had already been renamed.
SwapFeePercentageChanged = (
    dataframes['SwapFeePercentageChanged'][list(selected_columns)]
    .rename(columns=selected_columns)
)

In [5]:
# Check the frame after column selection and renaming
SwapFeePercentageChanged

Unnamed: 0,block_number,log_index,transaction_hash,event,fee
0,12505422,109,0x0e5c53950574cb933da47d5a885ae7f134849f43fa77eb818d9efd5cc65dbed0,SwapFeePercentageChanged,4100000000000000
1,12654826,187,0x7aadce84f11aa371f3ae09e56fbd46db03da1d3723d6df345fbde0f9a71548c1,SwapFeePercentageChanged,3900000000000000
2,12693310,299,0xd2bb72c0cfcea82cd4f7c3ff02fe7fe5b52bae983a71dfa0b746829d3233c0d5,SwapFeePercentageChanged,3500000000000000
3,12814302,2,0x22e8bd2d2df1bdf4ae53ce8621078b7003dc74b8254de647d1d378dffef942de,SwapFeePercentageChanged,3300000000000000
4,12859412,271,0xf4241a0d9993a2d2ef6c0ae84fd35686f1e164ce804735ec10486d568959979d,SwapFeePercentageChanged,3000000000000000
...,...,...,...,...,...
925,19980897,182,0x36654991e5f8ba562c2fc6f8041c5f0bfcbc8378579f692d46a137b3c99ef033,SwapFeePercentageChanged,2500000000000000
926,19981171,189,0x0a06bbeb8c48bf4363ba361714f5caf366076a2273dc1b6901d12a1e4cea9f51,SwapFeePercentageChanged,500000000000000
927,19981171,195,0x0a06bbeb8c48bf4363ba361714f5caf366076a2273dc1b6901d12a1e4cea9f51,SwapFeePercentageChanged,2500000000000000
928,19999851,63,0x7f6f897ed561572c2ad056623aac9977435d9beb735d7312c36c790b3231f22f,SwapFeePercentageChanged,500000000000000


In [6]:
# Persist the fee-change events as a DuckDB table.
# OR REPLACE keeps this cell re-runnable: my_database.duckdb persists on disk
# between sessions, so a plain CREATE TABLE raises as soon as the table exists
# from an earlier run of the notebook.
# The FROM clause names the in-scope pandas DataFrame, which DuckDB queries directly.
con.execute('CREATE OR REPLACE TABLE wbtcweth_fee_change AS SELECT * FROM SwapFeePercentageChanged').fetchdf()

# Commit the changes
con.commit()

# Close the connection; the connection cell must be re-run before `con` can be used again
con.close()