In [1]:
import pandas as pd
import os

# Input file and the USD price cut-off used for the summary.
file_path = '/home/user/gzhao/Thesis/Price/token_price.csv'
PRICE_THRESHOLD = 7000


def summarize_high_prices(prices, threshold=7000):
    """Summarize, per token, the price observations strictly above ``threshold``.

    Parameters
    ----------
    prices : pandas.DataFrame
        Must contain the columns ``'token.name'``, ``'token.id'`` and
        ``'priceUSD'``.
    threshold : int or float, default 7000
        Rows whose ``priceUSD`` is not strictly greater than this value
        (including missing prices) are ignored.

    Returns
    -------
    pandas.DataFrame
        One row per (``token.name``, ``token.id``) pair with the columns
        ``highest_price``, ``lowest_price``, ``count_above_<threshold>`` and
        ``price_difference`` (highest minus lowest).
    """
    above = prices[prices['priceUSD'] > threshold]

    # Every remaining row is already above the threshold, so the built-in
    # 'count' gives the number of qualifying observations directly; no
    # per-group Python lambda is needed.
    count_column = f'count_above_{threshold}'

    # NOTE: groupby drops groups whose key is missing (pandas default
    # dropna=True), so rows without a token.name or token.id are not reported.
    result = (
        above.groupby(['token.name', 'token.id'])
        .agg(
            highest_price=('priceUSD', 'max'),
            lowest_price=('priceUSD', 'min'),
            **{count_column: ('priceUSD', 'count')},
        )
        .reset_index()
    )

    result['price_difference'] = result['highest_price'] - result['lowest_price']
    return result


if os.path.exists(file_path):
    # Keep the raw frame under its own name so re-running later steps does not
    # require re-reading the CSV.
    token_price_raw = pd.read_csv(file_path)

    # `token_price` keeps its original meaning: only rows above the threshold.
    token_price = token_price_raw[token_price_raw['priceUSD'] > PRICE_THRESHOLD]

    # Per-token statistics (token.id is retained as a grouping key).
    summary = summarize_high_prices(token_price, PRICE_THRESHOLD)

    # Export to a CSV file
    output_path = './token_price_summary_with_id.csv'
    summary.to_csv(output_path, index=False)
    print(f"Summary successfully exported to: {output_path}")
else:
    print("File path error, please check if the file exists: ", file_path)

Summary successfully exported to: ./token_price_summary_with_id.csv


In [2]:
# Blacklist: rows whose token.id appears here are excluded from the export.
remove_ids = [
    "0x9cea2ed9e47059260c97d697f82b8a14efa61ea5",
    "0x632fd938b98d740faee69112ed41257be3f83c7c",
    "0xf25c91c87e0b1fd9b4064af0f427157aab0193a7",
    "0x058349297672b6cc7ccb6e59a679c5add74a6898",
    "0x08389495d7456e1951ddf7c3a1314a4bfb646d8b",
    "0xe8847d2fa66d0d1f4a77221cae1e47d8d59cf7d7",
    "0xf51ebf9a26dbc02b13f8b3a9110dac47a4d62d78",
    "0x4b7ee45f30767f36f06f79b32bf1fca6f726deda",
    "0x4f7aff8f0c78b51c0e30f02f27a67b5a6a11552b",
    "0x239b0fa917d85c21cf6435464c2c6aa3d45f6720",
    "0x57933314b1a31f91871acd557e3d014100f97e08",
    "0x9631483f28b7f5cbf7d435ab249be8f709215bc3",
    "0x9891a469c481a77b1603a233837c61ec01555ce9",
    "0x0d4a11d5eeaac28ec3f61d100daf4d40471f1852",
    "0x2c974b2d0ba1716e644c1fc59982a89ddd2ff724",
    "0xa3c22370de5f9544f0c4de126b1e46ceadf0a51b"
]

# Re-read the full price table from the path defined in the first cell.
df = pd.read_csv(file_path)

# Flag blacklisted rows (exact string match on token.id), then keep the rest.
is_blacklisted = df['token.id'].isin(remove_ids)
filtered_df = df.loc[~is_blacklisted]

# Write the surviving rows to a separate file; the input CSV is left untouched.
output_path = '/home/user/gzhao/Thesis/Price/token_price_filtered.csv'
filtered_df.to_csv(output_path, index=False)

print(f"Filtered data saved to: {output_path}")

Filtered data saved to: /home/user/gzhao/Thesis/Price/token_price_filtered.csv
