In [1]:
import joblib
import pandas as pd
from sklearn.preprocessing import StandardScaler


# Load the persisted estimator and scaler from the working directory.
# NOTE(review): joblib.load unpickles its input, which can execute arbitrary
# code -- only load artifacts that come from a trusted source.
model = joblib.load('TenYearCHD.joblib')
scaler = joblib.load('scaler.joblib')

# Column order handed to the scaler and the model. Per the original author's
# note this must match the order used at training time -- TODO confirm against
# the training notebook.
feature_order = [
    "age",
    "sex",
    "currentSmoker",
    "cigsPerDay",
    "diabetes",
    "totChol",
    "sysBP",
    "BMI",
    "prevalentHyp",
    "BPMeds",
    "glucose",
]

# Four hand-written example patients; replace with your own realistic values.
patient_values = {
    "age": [85, 55, 35, 20],
    "sex": [0, 1, 0, 1],  # 0=Female, 1=Male
    "currentSmoker": [0, 1, 1, 1],  # 0=No, 1=Yes
    "cigsPerDay": [0, 7, 12, 5],  # Number of cigarettes per day
    "diabetes": [1, 0, 1, 0],  # 0=No, 1=Yes
    "totChol": [245, 180, 220, 165],  # Total cholesterol (mg/dL)
    "sysBP": [160, 130, 145, 110],  # Systolic blood pressure (mmHg)
    "BMI": [28.2, 28.8, 25.1, 24.0],  # Body Mass Index
    "prevalentHyp": [1, 0, 0, 0],  # 0=No hypertension, 1=Has hypertension
    "BPMeds": [1, 0, 0, 0],  # 0=Not on BP medication, 1=On BP medication
    "glucose": [110, 85, 95, 78],  # Fasting glucose (mg/dL)
}
new_data = pd.DataFrame(patient_values)
print("New Data:")
print(new_data)

# Select the columns in the expected order (a no-op for the dict above, but it
# guards against the dict being edited out of order) and show the frame again.
new_data = new_data[feature_order]
print(new_data)

# Apply the loaded scaler to the raw feature values.
X_new = scaler.transform(new_data)
print("Scaled New Data Shape:", X_new.shape)

# Predict on the scaled features: hard labels plus per-class probabilities.
predictions = model.predict(X_new)
class_probabilities = model.predict_proba(X_new)
# Column 1 is taken as the probability of CHD=1 (per the original note;
# presumably model.classes_ is [0, 1] -- verify).
prediction_probs = class_probabilities[:, 1]

# Attach both prediction columns to a copy of the unscaled inputs.
new_data_with_predictions = new_data.assign(
    predicted_TenYearCHD=predictions,
    TenYearCHD_probability=prediction_probs,
)

# Display results
print("\nPrediction Results:")
print(new_data_with_predictions)

New Data:
   age  sex  currentSmoker  cigsPerDay  diabetes  totChol  sysBP   BMI  \
0   85    0              0           0         1      245    160  28.2   
1   55    1              1           7         0      180    130  28.8   
2   35    0              1          12         1      220    145  25.1   
3   20    1              1           5         0      165    110  24.0   

   prevalentHyp  BPMeds  glucose  
0             1       1      110  
1             0       0       85  
2             0       0       95  
3             0       0       78  
   age  sex  currentSmoker  cigsPerDay  diabetes  totChol  sysBP   BMI  \
0   85    0              0           0         1      245    160  28.2   
1   55    1              1           7         0      180    130  28.8   
2   35    0              1          12         1      220    145  25.1   
3   20    1              1           5         0      165    110  24.0   

   prevalentHyp  BPMeds  glucose  
0             1       1      110  
1  

