In [9]:
import platform
import psutil
import time

def get_size(bytes, suffix="B"):
    """
    Scale bytes to its proper format (e.g., 1253656 => 1.20MB)
    """
    factor = 1024
    for unit in ["", "K", "M", "G", "T", "P"]:
        if bytes < factor:
            return f"{bytes:.2f}{unit}{suffix}"
        bytes /= factor

print("="*40, "SYSTEM INFORMATION", "="*40)

# 1. System Info
uname = platform.uname()
print(f"System: {uname.system}")
print(f"Node Name: {uname.node}")
print(f"Release: {uname.release}")
print(f"Version: {uname.version}")
print(f"Machine: {uname.machine}")
print(f"Processor: {uname.processor}")
print("-" * 80)

# 2. CPU Information
print("="*40, "CPU INFORMATION", "="*40)
print(f"Physical cores: {psutil.cpu_count(logical=False)}")
print(f"Total (Logical) cores: {psutil.cpu_count(logical=True)}")
cpufreq = psutil.cpu_freq()
print(f"Max Frequency: {cpufreq.max:.2f}Mhz")
print(f"Current Frequency: {cpufreq.current:.2f}Mhz")
print(f"Total CPU Usage: {psutil.cpu_percent(interval=1)}%")
print("-" * 80)

# 3. RAM (Memory) Information
print("="*40, "MEMORY INFORMATION", "="*40)
svmem = psutil.virtual_memory()
print(f"Total RAM: {get_size(svmem.total)}")
print(f"Available RAM: {get_size(svmem.available)}")
print(f"Used RAM: {get_size(svmem.used)}")
print(f"RAM Usage Percentage: {svmem.percent}%")
print("-" * 80)

# 4. Disk Information (for the current partition/drive)
print("="*40, "DISK INFORMATION", "="*40)
# Get usage for the current working directory's partition
disk_usage = psutil.disk_usage('/')
print(f"Total Disk Space: {get_size(disk_usage.total)}")
print(f"Used Disk Space: {get_size(disk_usage.used)}")
print(f"Free Disk Space: {get_size(disk_usage.free)}")
print(f"Disk Usage Percentage: {disk_usage.percent}%")
print("="*80)

System: Linux
Node Name: codespaces-a44c5a
Release: 6.8.0-1030-azure
Version: #35~22.04.1-Ubuntu SMP Mon May 26 18:08:30 UTC 2025
Machine: x86_64
Processor: x86_64
--------------------------------------------------------------------------------
Physical cores: 1
Total (Logical) cores: 2
Max Frequency: 0.00Mhz
Current Frequency: 3238.88Mhz
Total CPU Usage: 5.0%
--------------------------------------------------------------------------------
Total RAM: 7.76GB
Available RAM: 3.76GB
Used RAM: 3.63GB
RAM Usage Percentage: 51.6%
--------------------------------------------------------------------------------
Total Disk Space: 31.33GB
Used Disk Space: 16.74GB
Free Disk Space: 12.97GB
Disk Usage Percentage: 56.4%


In [1]:
import pandas as pd

In [3]:
pd.__version__

'2.3.2'

In [2]:
df = pd.read_parquet("https://d37ci6vzurychx.cloudfront.net/trip-data/yellow_tripdata_2025-01.parquet")
df.shape

(3475226, 20)

In [4]:
df.head()

Unnamed: 0,VendorID,tpep_pickup_datetime,tpep_dropoff_datetime,passenger_count,trip_distance,RatecodeID,store_and_fwd_flag,PULocationID,DOLocationID,payment_type,fare_amount,extra,mta_tax,tip_amount,tolls_amount,improvement_surcharge,total_amount,congestion_surcharge,Airport_fee,cbd_congestion_fee
0,1,2025-01-01 00:18:38,2025-01-01 00:26:59,1.0,1.6,1.0,N,229,237,1,10.0,3.5,0.5,3.0,0.0,1.0,18.0,2.5,0.0,0.0
1,1,2025-01-01 00:32:40,2025-01-01 00:35:13,1.0,0.5,1.0,N,236,237,1,5.1,3.5,0.5,2.02,0.0,1.0,12.12,2.5,0.0,0.0
2,1,2025-01-01 00:44:04,2025-01-01 00:46:01,1.0,0.6,1.0,N,141,141,1,5.1,3.5,0.5,2.0,0.0,1.0,12.1,2.5,0.0,0.0
3,2,2025-01-01 00:14:27,2025-01-01 00:20:01,3.0,0.52,1.0,N,244,244,2,7.2,1.0,0.5,0.0,0.0,1.0,9.7,0.0,0.0,0.0
4,2,2025-01-01 00:21:34,2025-01-01 00:25:06,3.0,0.66,1.0,N,244,116,2,5.8,1.0,0.5,0.0,0.0,1.0,8.3,0.0,0.0,0.0
