In [None]:
import pandas as pd

# Column-oriented burn statistics, one list entry per rocket engine.
data = {
    'engine': ['Merlin', 'Raptor', 'Vulcain', 'BE-4', 'RD-180'],
    'thrust_kN': [845, 2300, 1350, 2400, 4150],  # kilonewtons
    'burn_time_sec': [162, 170, 600, 180, 210],
    'fuel_type': ['RP-1', 'Methane', 'Hydrogen', 'Methane', 'RP-1'],
}

# Each dict key becomes a column; rows follow list order.
df = pd.DataFrame.from_dict(data)

# Derived column: total impulse is thrust multiplied element-wise by burn time.
df['total_impulse_kN_sec'] = df['thrust_kN'].mul(df['burn_time_sec'])

# Add rule-based performance labels using fixed total-impulse thresholds
def classify_performance(row, *, heavy_threshold=400000, medium_threshold=200000) -> str:
    """Label an engine's lift class from its total impulse.

    Args:
        row: Any object supporting ``row['total_impulse_kN_sec']`` (for
            example a DataFrame row passed by ``df.apply(..., axis=1)``
            or a plain dict).
        heavy_threshold: Impulse strictly above this value is labelled
            ``'Heavy Lift'``. Defaults to 400000.
        medium_threshold: Impulse strictly above this value (and not above
            ``heavy_threshold``) is labelled ``'Medium Lift'``. Defaults
            to 200000.

    Returns:
        ``'Heavy Lift'``, ``'Medium Lift'`` or ``'Light Lift'``.

    Note:
        Both comparisons are strict, so a value exactly equal to a
        threshold falls into the lower class. A NaN impulse compares
        false against both thresholds and is therefore labelled
        ``'Light Lift'``.
    """
    impulse = row['total_impulse_kN_sec']
    if impulse > heavy_threshold:
        return 'Heavy Lift'
    if impulse > medium_threshold:
        return 'Medium Lift'
    return 'Light Lift'

# Label every engine by running the classifier once per row.
df['performance_class'] = df.apply(classify_performance, axis='columns')

# Mean thrust and mean burn time for each fuel type.
fuel_summary = df.groupby('fuel_type')[['thrust_kN', 'burn_time_sec']].agg('mean')

# Report: one newline-separated print call, emitting the same text as
# four consecutive print() calls would.
print(
    "🚀 Engine Data with Performance Classification:\n",
    df,
    "\n🔍 Average Performance by Fuel Type:\n",
    fuel_summary,
    sep="\n",
)

🚀 Engine Data with Performance Classification:

    engine  thrust_kN  burn_time_sec fuel_type  total_impulse_kN_sec  \
0   Merlin        845            162      RP-1                136890   
1   Raptor       2300            170   Methane                391000   
2  Vulcain       1350            600  Hydrogen                810000   
3     BE-4       2400            180   Methane                432000   
4   RD-180       4150            210      RP-1                871500   

  performance_class  
0        Light Lift  
1       Medium Lift  
2        Heavy Lift  
3        Heavy Lift  
4        Heavy Lift  

🔍 Average Performance by Fuel Type:

           thrust_kN  burn_time_sec
fuel_type                          
Hydrogen      1350.0          600.0
Methane       2350.0          175.0
RP-1          2497.5          186.0
