In [None]:
list = [4, 13, 0, 9, 0, 1, 2, 34]
number = list[::2]
print(number)

[4, 0, 0, 2]


In [None]:
list1 = [4, 13, 0, 9, 'a', 1, 2, 34]
for num in list1:
  if isinstance(num, (int, float)) and num !=0:
    print(f"1/{num}")
  else:
    print(f"not possible {num}")

1/4
1/13
not possible 0
1/9
not possible a
1/1
1/2
1/34


In [None]:
number = [4, 13, 0, 9, 0, 1, 2, 34]
for i in range(len(number)):
  for j in range(0, len(number)-i-1):
    if (type(number[j] == int or type[number[j]] == float) and (type(number[j+1] == int or type[number[j+1]] == float))):
      if number[j] > number[j+1]:
       number[j],number[j+1] = number[j+1], number[j]
       print(number)


[4, 0, 13, 9, 0, 1, 2, 34]
[4, 0, 9, 13, 0, 1, 2, 34]
[4, 0, 9, 0, 13, 1, 2, 34]
[4, 0, 9, 0, 1, 13, 2, 34]
[4, 0, 9, 0, 1, 2, 13, 34]
[0, 4, 9, 0, 1, 2, 13, 34]
[0, 4, 0, 9, 1, 2, 13, 34]
[0, 4, 0, 1, 9, 2, 13, 34]
[0, 4, 0, 1, 2, 9, 13, 34]
[0, 0, 4, 1, 2, 9, 13, 34]
[0, 0, 1, 4, 2, 9, 13, 34]
[0, 0, 1, 2, 4, 9, 13, 34]


In [2]:
pip install transformers



In [1]:
# Install necessary libraries if not already installed
# pip install pandas numpy transformers

import pandas as pd
import numpy as np
from transformers import pipeline

# Step 1: Generate Synthetic Patient Health Records

def generate_synthetic_health_records(num_records):
    # Sample data
    names = ["John Doe", "Jane Smith", "Alice Johnson", "Bob Brown", "Charlie Davis"]
    genders = ["Male", "Female", "Other"]
    heights = np.random.randint(150, 200, size=num_records)  # Height in cm
    weights = np.random.randint(50, 120, size=num_records)   # Weight in kg

    # Dictionary of conditions and their corresponding medications
    conditions = {
        "Diabetes": ["Metformin", "Insulin", "Glyburide", "Acarbose"],
        "Hypertension": ["Lisinopril", "Amlodipine", "Losartan", "Hydrochlorothiazide"],
        "Asthma": ["Albuterol", "Salmeterol", "Fluticasone", "Montelukast"],
        "Heart Disease": ["Aspirin", "Atorvastatin", "Beta Blockers", "ACE Inhibitors"],
        "None": ["No medication"]
    }

    allergies = ["None", "Peanuts", "Shellfish", "Penicillin", "Aspirin"]
    lifestyles = ["Smoker", "Non-Smoker", "Occasional Drinker", "Regular Drinker", "Active", "Sedentary"]

    records = []

    for i in range(num_records):
        name = np.random.choice(names)
        age = np.random.randint(20, 80)
        gender = np.random.choice(genders)
        condition = np.random.choice(list(conditions.keys()))
        medication = np.random.choice(conditions[condition])  # Randomly select medication for the condition
        visit_date = pd.Timestamp.now() - pd.DateOffset(days=np.random.randint(1, 365))  # Random past date
        blood_pressure = f"{np.random.randint(110, 180)}/{np.random.randint(60, 120)}"  # Random BP
        cholesterol_level = np.random.randint(150, 300)  # Random cholesterol level
        allergy = np.random.choice(allergies)
        lifestyle = np.random.choice(lifestyles)

        records.append({
            "Name": name,
            "Age": age,
            "Gender": gender,
            "Height (cm)": heights[i],
            "Weight (kg)": weights[i],
            "Condition": condition,
            "Medication": medication,
            "Visit Date": visit_date,
            "Blood Pressure": blood_pressure,
            "Cholesterol Level": cholesterol_level,
            "Allergies": allergy,
            "Lifestyle": lifestyle
        })

    return pd.DataFrame(records)

# Create Synthetic Data
num_records = 10000  # Number of synthetic records to generate
synthetic_data = generate_synthetic_health_records(num_records)

# Display the first few generated synthetic data records
print("Synthetic Patient Health Records:")
print(synthetic_data.head())

# Save to Excel
output_file = "synthetic_patient_health_records.xlsx"
synthetic_data.to_excel(output_file, index=False)

print(f"\nSynthetic patient health records saved to {output_file}.")



# Step 3: Summarize the Patient Health Records using LLM
def summarize_records(data):
    # Load a pre-trained summarization model
    summarizer = pipeline("summarization")

    # Prepare the records for summarization
    summaries = []
    for index, row in data.iterrows():
        record_summary = f"Patient {row['Name']}, Age {row['Age']}, Condition: {row['Condition']}, Medication: {row['Medication']}"
        summaries.append(record_summary)

    # Generate a summary of the health records
    full_summary = "\n".join(summaries)

    # Limit the input length if necessary
    max_input_length = 500  # You can adjust this based on model capability
    if len(full_summary) > max_input_length:
        full_summary = full_summary[:max_input_length]  # Truncate if too long

    summary = summarizer(full_summary, max_length=50, min_length=25, do_sample=False)

    return summary[0]['summary_text']

# Step 4: Generate and Print Summary
summary = summarize_records(synthetic_data)
print("\nSummary of Patient Health Records:")
print(summary)


Synthetic Patient Health Records:
            Name  Age Gender  Height (cm)  Weight (kg)     Condition  \
0      Bob Brown   34  Other          182           82      Diabetes   
1  Alice Johnson   65   Male          169          114  Hypertension   
2  Charlie Davis   49  Other          177           86  Hypertension   
3  Alice Johnson   61   Male          198           66  Hypertension   
4  Alice Johnson   50   Male          164           51        Asthma   

   Medication                 Visit Date Blood Pressure  Cholesterol Level  \
0   Metformin 2024-02-28 13:14:51.258974         115/87                162   
1    Losartan 2024-08-19 13:14:51.259489         131/96                190   
2  Lisinopril 2024-08-09 13:14:51.259714        117/116                179   
3    Losartan 2024-08-27 13:14:51.259914        132/107                248   
4  Salmeterol 2024-05-31 13:14:51.260132         134/69                267   

   Allergies   Lifestyle  
0    Aspirin  Non-Smoker  
1  Shellfi

No model was supplied, defaulted to sshleifer/distilbart-cnn-12-6 and revision a4f8f3e (https://huggingface.co/sshleifer/distilbart-cnn-12-6).
Using a pipeline without specifying a model name and revision in production is not recommended.



Synthetic patient health records saved to synthetic_patient_health_records.xlsx.


The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.



Summary of Patient Health Records:
 Alice Johnson, Age 65, Condition: Hypertension, Medication: Losartan. Patients Charlie Davis, Age 49, and Bob Brown, Age 34, Conditions: Diabetes, Medications: Metformin.                Patient
