ETH

In [None]:
# This is the first code cell of the notebook, so pandas has to be imported
# here for the cell to run on a fresh kernel.
import pandas as pd

# Raw hourly ETH/USDT export. The path follows the same
# '/content/<SYMBOL>USDT_1h_2017_2025.csv' pattern used by every other
# loader in this notebook (the previous value had a stray '/' inside the
# file name and was relative to the working directory).
df_eth = pd.read_csv("/content/ETHUSDT_1h_2017_2025.csv")

In [None]:
# -------------------------
# 1. Imports
# -------------------------
import pandas as pd
from sklearn.preprocessing import MinMaxScaler

# -------------------------
# 2-5. Load, clean and enrich the ETH candles
# -------------------------
# One chained pipeline, evaluated top to bottom:
#   - parse both timestamp columns, turning unparseable entries into NaT
#   - discard rows whose 'Open Time' or 'Close Time' became NaT
#   - narrow to the columns used downstream ('Close Time' is dropped here)
#   - discard rows that still contain any missing value
#   - add the two percentage features
df = (
    pd.read_csv('/content/ETHUSDT_1h_2017_2025.csv')  # point this at your ETH CSV
    .assign(**{
        'Open Time': lambda raw: pd.to_datetime(raw['Open Time'], errors='coerce'),
        'Close Time': lambda raw: pd.to_datetime(raw['Close Time'], errors='coerce'),
    })
    .dropna(subset=['Open Time', 'Close Time'])
    .loc[:, ['Open Time', 'Open', 'High', 'Low', 'Close', 'Volume', 'Quote Volume', 'Trades']]
    .dropna()
    .assign(
        # High-low range expressed as a percentage of the close.
        HL_PCT=lambda bars: (bars['High'] - bars['Low']) / bars['Close'] * 100,
        # Open-to-close move expressed as a percentage of the open.
        PCT_change=lambda bars: (bars['Close'] - bars['Open']) / bars['Open'] * 100,
    )
)

# -------------------------
# 6. Min-max scaling
# -------------------------
# Columns handed to the scaler, in the order they appear in the output file.
features = [
    'Open', 'High', 'Low', 'Close', 'Volume',
    'Quote Volume', 'Trades', 'HL_PCT', 'PCT_change',
]
scaler = MinMaxScaler()  # default settings; fitted on every remaining row
scaled_features = scaler.fit_transform(df[features])

# Wrap the scaled array in a frame and append the (unscaled) timestamps as the
# last column. `.values` attaches them by position, so the fresh 0..n-1 index
# of the new frame does not need to match df's index.
scaled_df = pd.DataFrame(scaled_features, columns=features).assign(
    **{'Open Time': df['Open Time'].values}
)

# -------------------------
# 7. Persist the full cleaned & scaled table
# -------------------------
scaled_df.to_csv('ETH_cleaned_scaled.csv', index=False)
print("Entire ETH cleaned & scaled dataset saved successfully as 'ETH_cleaned_scaled.csv'")


Entire ETH cleaned & scaled dataset saved successfully as 'ETH_cleaned_scaled.csv'


XRP

In [None]:
import pandas as pd

# Read the raw hourly XRP/USDT export so its schema can be inspected before
# the preprocessing cell relies on specific column names.
df = pd.read_csv(filepath_or_buffer='/content/XRPUSDT_1h_2017_2025.csv')

# Show the header exactly as pandas parsed it.
print(df.columns)


Index(['Open Time', 'Open', 'High', 'Low', 'Close', 'Volume', 'Close Time',
       'Quote Volume', 'Trades', 'Taker Buy Base', 'Taker Buy Quote',
       'Ignore'],
      dtype='object')


In [None]:
# -------------------------
# 1. Imports
# -------------------------
import pandas as pd
from sklearn.preprocessing import MinMaxScaler

# -------------------------
# 2. Load XRP dataset
# -------------------------
df = pd.read_csv('/content/XRPUSDT_1h_2017_2025.csv')

# Convert timestamp columns. Unparseable entries become NaT instead of raising,
# and the affected rows are dropped - the same handling the ETH, LTC, BNB and
# BTC cells of this notebook apply.
df['Open Time'] = pd.to_datetime(df['Open Time'], errors='coerce')
df['Close Time'] = pd.to_datetime(df['Close Time'], errors='coerce')
df = df.dropna(subset=['Open Time', 'Close Time'])

# -------------------------
# 3. Drop unwanted columns
# -------------------------
# Explicit copy so the column assignments below operate on an independent
# frame rather than on a selection of the raw one.
df = df[['Open Time','Open','High','Low','Close','Volume','Quote Volume','Trades']].copy()

# -------------------------
# 4. Handle missing values
# -------------------------
# Rebind instead of inplace=True so re-running the cell never depends on a
# half-mutated frame.
df = df.dropna()

# -------------------------
# 5. Feature Engineering
# -------------------------
# High-low range as a percentage of the close.
df['HL_PCT'] = (df['High'] - df['Low']) / df['Close'] * 100
# Open-to-close move as a percentage of the open.
df['PCT_change'] = (df['Close'] - df['Open']) / df['Open'] * 100

# Select features for scaling
features = ['Open','High','Low','Close','Volume','Quote Volume','Trades','HL_PCT','PCT_change']
processed_df = df[['Open Time'] + features].copy()

# -------------------------
# 6. Scaling / Normalization
# -------------------------
# NOTE(review): the scaler is fitted on ALL rows, i.e. before the train/test
# split below, so the min/max applied to train_df are computed from rows that
# also end up in test_df. Left unchanged because the saved CSV is the fully
# scaled table; if train_df/test_df feed a model, consider fitting on the
# training rows only.
scaler = MinMaxScaler()
scaled_features = scaler.fit_transform(processed_df[features])
scaled_df = pd.DataFrame(scaled_features, columns=features)
# `.values` attaches the timestamps by position; scaled_df has a fresh
# 0..n-1 index that does not match processed_df's index after dropna.
scaled_df['Open Time'] = processed_df['Open Time'].values

# -------------------------
# 7. Train-Test Split (time series style)
# -------------------------
# Positional split in file order: the first 80% of rows form train_df and the
# remainder test_df (no shuffling).
train_size = int(len(scaled_df) * 0.8)
train_df = scaled_df[:train_size]
test_df = scaled_df[train_size:]

# -------------------------
# 8. Save processed files in Colab
# -------------------------
# Only the full scaled table is written; train_df/test_df stay in memory.
scaled_df.to_csv('XRP_cleaned_scaled.csv', index=False)

print("Entire cleaned & scaled dataset saved successfully as 'XRP_cleaned_scaled.csv'")

Entire cleaned & scaled dataset saved successfully as 'XRP_cleaned_scaled.csv'


LTC

In [None]:
# -------------------------
# 1. Imports
# -------------------------
import pandas as pd
from sklearn.preprocessing import MinMaxScaler

# -------------------------
# 2-5. Load, clean and enrich the LTC candles
# -------------------------
# One chained pipeline, evaluated top to bottom:
#   - parse both timestamp columns, turning unparseable entries into NaT
#   - discard rows whose 'Open Time' or 'Close Time' became NaT
#   - narrow to the columns used downstream ('Close Time' is dropped here)
#   - discard rows that still contain any missing value
#   - add the two percentage features
df = (
    pd.read_csv('/content/LTCUSDT_1h_2017_2025.csv')
    .assign(**{
        'Open Time': lambda raw: pd.to_datetime(raw['Open Time'], errors='coerce'),
        'Close Time': lambda raw: pd.to_datetime(raw['Close Time'], errors='coerce'),
    })
    .dropna(subset=['Open Time', 'Close Time'])
    .loc[:, ['Open Time', 'Open', 'High', 'Low', 'Close', 'Volume', 'Quote Volume', 'Trades']]
    .dropna()
    .assign(
        # High-low range expressed as a percentage of the close.
        HL_PCT=lambda bars: (bars['High'] - bars['Low']) / bars['Close'] * 100,
        # Open-to-close move expressed as a percentage of the open.
        PCT_change=lambda bars: (bars['Close'] - bars['Open']) / bars['Open'] * 100,
    )
)

# -------------------------
# 6. Min-max scaling
# -------------------------
# Columns handed to the scaler, in the order they appear in the output file.
features = [
    'Open', 'High', 'Low', 'Close', 'Volume',
    'Quote Volume', 'Trades', 'HL_PCT', 'PCT_change',
]
scaler = MinMaxScaler()  # default settings; fitted on every remaining row
scaled_features = scaler.fit_transform(df[features])

# Wrap the scaled array in a frame and append the (unscaled) timestamps as the
# last column. `.values` attaches them by position, so the fresh 0..n-1 index
# of the new frame does not need to match df's index.
scaled_df = pd.DataFrame(scaled_features, columns=features).assign(
    **{'Open Time': df['Open Time'].values}
)

# -------------------------
# 7. Persist the full cleaned & scaled table
# -------------------------
scaled_df.to_csv('LTC_cleaned_scaled.csv', index=False)
print("Entire LTC cleaned & scaled dataset saved successfully as 'LTC_cleaned_scaled.csv'")


Entire LTC cleaned & scaled dataset saved successfully as 'LTC_cleaned_scaled.csv'


BNB

In [None]:
# -------------------------
# 1. Imports
# -------------------------
import pandas as pd
from sklearn.preprocessing import MinMaxScaler

# -------------------------
# 2-5. Load, clean and enrich the BNB candles
# -------------------------
# One chained pipeline, evaluated top to bottom:
#   - parse both timestamp columns, turning unparseable entries into NaT
#   - discard rows whose 'Open Time' or 'Close Time' became NaT
#   - narrow to the columns used downstream ('Close Time' is dropped here)
#   - discard rows that still contain any missing value
#   - add the two percentage features
df = (
    pd.read_csv('/content/BNBUSDT_1h_2017_2025.csv')  # point this at your BNB CSV
    .assign(**{
        'Open Time': lambda raw: pd.to_datetime(raw['Open Time'], errors='coerce'),
        'Close Time': lambda raw: pd.to_datetime(raw['Close Time'], errors='coerce'),
    })
    .dropna(subset=['Open Time', 'Close Time'])
    .loc[:, ['Open Time', 'Open', 'High', 'Low', 'Close', 'Volume', 'Quote Volume', 'Trades']]
    .dropna()
    .assign(
        # High-low range expressed as a percentage of the close.
        HL_PCT=lambda bars: (bars['High'] - bars['Low']) / bars['Close'] * 100,
        # Open-to-close move expressed as a percentage of the open.
        PCT_change=lambda bars: (bars['Close'] - bars['Open']) / bars['Open'] * 100,
    )
)

# -------------------------
# 6. Min-max scaling
# -------------------------
# Columns handed to the scaler, in the order they appear in the output file.
features = [
    'Open', 'High', 'Low', 'Close', 'Volume',
    'Quote Volume', 'Trades', 'HL_PCT', 'PCT_change',
]
scaler = MinMaxScaler()  # default settings; fitted on every remaining row
scaled_features = scaler.fit_transform(df[features])

# Wrap the scaled array in a frame and append the (unscaled) timestamps as the
# last column. `.values` attaches them by position, so the fresh 0..n-1 index
# of the new frame does not need to match df's index.
scaled_df = pd.DataFrame(scaled_features, columns=features).assign(
    **{'Open Time': df['Open Time'].values}
)

# -------------------------
# 7. Persist the full cleaned & scaled table
# -------------------------
scaled_df.to_csv('BNB_cleaned_scaled.csv', index=False)
print("Entire BNB cleaned & scaled dataset saved successfully as 'BNB_cleaned_scaled.csv'")


Entire BNB cleaned & scaled dataset saved successfully as 'BNB_cleaned_scaled.csv'


BTC

In [None]:
# -------------------------
# 1. Imports
# -------------------------
import pandas as pd
from sklearn.preprocessing import MinMaxScaler

# -------------------------
# 2-5. Load, clean and enrich the BTC candles
# -------------------------
# One chained pipeline, evaluated top to bottom:
#   - parse both timestamp columns, turning unparseable entries into NaT
#   - discard rows whose 'Open Time' or 'Close Time' became NaT
#   - narrow to the columns used downstream ('Close Time' is dropped here)
#   - discard rows that still contain any missing value
#   - add the two percentage features
df = (
    pd.read_csv('/content/BTCUSDT_1h_2017_2025.csv')  # point this at your BTC CSV
    .assign(**{
        'Open Time': lambda raw: pd.to_datetime(raw['Open Time'], errors='coerce'),
        'Close Time': lambda raw: pd.to_datetime(raw['Close Time'], errors='coerce'),
    })
    .dropna(subset=['Open Time', 'Close Time'])
    .loc[:, ['Open Time', 'Open', 'High', 'Low', 'Close', 'Volume', 'Quote Volume', 'Trades']]
    .dropna()
    .assign(
        # High-low range expressed as a percentage of the close.
        HL_PCT=lambda bars: (bars['High'] - bars['Low']) / bars['Close'] * 100,
        # Open-to-close move expressed as a percentage of the open.
        PCT_change=lambda bars: (bars['Close'] - bars['Open']) / bars['Open'] * 100,
    )
)

# -------------------------
# 6. Min-max scaling
# -------------------------
# Columns handed to the scaler, in the order they appear in the output file.
features = [
    'Open', 'High', 'Low', 'Close', 'Volume',
    'Quote Volume', 'Trades', 'HL_PCT', 'PCT_change',
]
scaler = MinMaxScaler()  # default settings; fitted on every remaining row
scaled_features = scaler.fit_transform(df[features])

# Wrap the scaled array in a frame and append the (unscaled) timestamps as the
# last column. `.values` attaches them by position, so the fresh 0..n-1 index
# of the new frame does not need to match df's index.
scaled_df = pd.DataFrame(scaled_features, columns=features).assign(
    **{'Open Time': df['Open Time'].values}
)

# -------------------------
# 7. Persist the full cleaned & scaled table
# -------------------------
scaled_df.to_csv('BTC_cleaned_scaled.csv', index=False)
print("Entire BTC cleaned & scaled dataset saved successfully as 'BTC_cleaned_scaled.csv'")


Entire BTC cleaned & scaled dataset saved successfully as 'BTC_cleaned_scaled.csv'
