In [1]:
from transformers import AutoModelForCausalLM, AutoTokenizer, Trainer, TrainingArguments, DataCollatorWithPadding
from datasets import load_dataset
import torch
import numpy as np

  from .autonotebook import tqdm as notebook_tqdm


In [4]:
# Hugging Face Hub id shared by the model and tokenizer loads below.
checkpoint = 'TinyLlama/TinyLlama-1.1B-Chat-v1.0'

# Load the causal-LM weights and the matching tokenizer from the same checkpoint id.
# NOTE(review): in the cells visible here `model` is only moved to a device and
# `tokenizer` is not used at all; the question cells go through `med_pipeline`
# instead. Confirm later cells need this load before keeping it.
model = AutoModelForCausalLM.from_pretrained(checkpoint)
tokenizer = AutoTokenizer.from_pretrained(checkpoint)

In [2]:
from transformers import pipeline, AutoModel

In [5]:
# Choose the compute device: CUDA when PyTorch reports a usable GPU, otherwise the CPU.
if torch.cuda.is_available():
    device = 'cuda'
else:
    device = 'cpu'

# Move the already-loaded `model` onto that device, then report which one was picked.
model.to(device)
print('using', device)

using cpu


In [6]:

# Hub id of the medical model; the same id supplies both the weights and the tokenizer.
MED_CHECKPOINT = 'medalpaca/medalpaca-7b'

# Text-generation pipeline used by the question cells that follow.
#
# `max_new_tokens` bounds only the generated completion. The earlier
# `max_length=500` counted the prompt tokens as well, so the long clinical
# vignettes consumed most of the budget and a prompt above the cap would leave
# no room for an answer. The value 500 is kept so that no prompt gets less
# room to answer than it had before.
#
# NOTE(review): the `device` chosen in the previous cell is not passed here, so
# this pipeline runs on the library's default device. Passing `device=device`
# would use a GPU when present, but a 7B model may not fit in GPU memory at
# full precision -- confirm before enabling.
med_pipeline = pipeline(
    'text-generation',
    model=MED_CHECKPOINT,
    tokenizer=MED_CHECKPOINT,
    max_new_tokens=500,
)

Loading checkpoint shards: 100%|██████████| 3/3 [01:11<00:00, 23.74s/it]
You are using the default legacy behaviour of the <class 'transformers.models.llama.tokenization_llama.LlamaTokenizer'>. This is expected, and simply means that the `legacy` (previous) behavior will be used so nothing changes for you. If you want to use the new behaviour, set `legacy=False`. This should only be set if you understand what it means, and thoroughly read the reason why this was added as explained in https://github.com/huggingface/transformers/pull/24565


In [7]:
# Multiple-choice vignette: pregnant patient at 22 weeks with burning on urination.
# The prompt ends with "Answer:" and a newline, so generation continues right after it.
# NOTE(review): `response0` holds the prompt text (not a model response) and its
# result is stored as `med_output1`; both names are kept unchanged here.
response0 = (
    "Answer the question using the context below.\n"
    "Context: A 23-year-old pregnant woman at 22 weeks gestation presents with burning upon urination. She states it started 1 day ago and has been worsening despite drinking more water and taking cranberry extract. She otherwise feels well and is followed by a doctor for her pregnancy. Her temperature is 97.7°F (36.5°C), blood pressure is 122/77 mmHg, pulse is 80/min, respirations are 19/min, and oxygen saturation is 98% on room air. Physical exam is notable for an absence of costovertebral angle tenderness and a gravid uterus.\n"
    "Question: Which of the following is the best treatment for this patient? options: {A: Ampicillin, B: Ceftriaxone, C: Ciprofloxacin, D: Doxycycline, E: Nitrofurantoin}\n"
    "Answer:\n"
)

# Run the prompt through the medical pipeline and display the raw result.
med_output1 = med_pipeline(response0)
med_output1


[{'generated_text': 'Answer the question using the context below.\nContext: A 23-year-old pregnant woman at 22 weeks gestation presents with burning upon urination. She states it started 1 day ago and has been worsening despite drinking more water and taking cranberry extract. She otherwise feels well and is followed by a doctor for her pregnancy. Her temperature is 97.7°F (36.5°C), blood pressure is 122/77 mmHg, pulse is 80/min, respirations are 19/min, and oxygen saturation is 98% on room air. Physical exam is notable for an absence of costovertebral angle tenderness and a gravid uterus.\nQuestion: Which of the following is the best treatment for this patient? options: {A: Ampicillin, B: Ceftriaxone, C: Ciprofloxacin, D: Doxycycline, E: Nitrofurantoin}\nAnswer:\nA'}]

In [9]:
# Multiple-choice vignette: sudden unexplained death of a 3-month-old during sleep.
# The prompt ends with "Answer:" and a newline, so generation continues right after it.
# NOTE(review): `response1` holds the prompt text (not a model response) and its
# result is stored as `med_output2`; both names are kept unchanged here.
response1 = (
    "Answer the question using the context below.\n"
    "Context: A 3-month-old baby died suddenly at night while asleep. His mother noticed that he had died only after she awoke in the morning. No cause of death was determined based on the autopsy.\n"
    "Question: Which of the following precautions could have prevented the death of the baby? Options: {A: Placing the infant in a supine position on a firm mattress while sleeping, B: Routine postnatal electrocardiogram (ECG), C: Keeping the infant covered and maintaining a high room temperature, D: Application of a device to maintain the sleeping position, E: Avoiding pacifier use during sleep}\n"
    "Answer:\n"
)

# Run the prompt through the medical pipeline and display the raw result.
med_output2 = med_pipeline(response1)
med_output2

[{'generated_text': 'Answer the question using the context below.\nContext: A 3-month-old baby died suddenly at night while asleep. His mother noticed that he had died only after she awoke in the morning. No cause of death was determined based on the autopsy.\nQuestion: Which of the following precautions could have prevented the death of the baby? Options: {A: Placing the infant in a supine position on a firm mattress while sleeping, B: Routine postnatal electrocardiogram (ECG), C: Keeping the infant covered and maintaining a high room temperature, D: Application of a device to maintain the sleeping position, E: Avoiding pacifier use during sleep}\nAnswer:\nA'}]

In [10]:
# Multiple-choice vignette: 3-week-old infant regurgitating feeds with yellow vomit.
# The prompt ends with "Answer:" and a newline, so generation continues right after it.
# NOTE(review): `response2` holds the prompt text (not a model response) and its
# result is stored as `med_output3`; both names are kept unchanged here.
response2 = (
    "Answer the question using the context below.\n"
    "Context: A mother brings her 3-week-old infant to the pediatrician's office because she is concerned about his feeding habits. He was born without complications and has not had any medical problems up until this time. However, for the past 4 days, he has been fussy, is regurgitating all of his feeds, and his vomit is yellow in color. On physical exam, the child's abdomen is minimally distended but no other abnormalities are appreciated.\n"
    "Question: Which of the following embryologic errors could account for this presentation? Options: {A: Abnormal migration of ventral pancreatic bud, B: Complete failure of proximal duodenum to recanalize, C: Error in neural crest cell migration, D: Abnormal hypertrophy of the pylorus, E: Failure of lateral body folds to move ventrally and fuse in the midline}\n"
    "Answer:\n"
)

# Run the prompt through the medical pipeline and display the raw result.
med_output3 = med_pipeline(response2)
med_output3

[{'generated_text': "Answer the question using the context below.\nContext: A mother brings her 3-week-old infant to the pediatrician's office because she is concerned about his feeding habits. He was born without complications and has not had any medical problems up until this time. However, for the past 4 days, he has been fussy, is regurgitating all of his feeds, and his vomit is yellow in color. On physical exam, the child's abdomen is minimally distended but no other abnormalities are appreciated.\nQuestion: Which of the following embryologic errors could account for this presentation? Options: {A: Abnormal migration of ventral pancreatic bud, B: Complete failure of proximal duodenum to recanalize, C: Error in neural crest cell migration, D: Abnormal hypertrophy of the pylorus, E: Failure of lateral body folds to move ventrally and fuse in the midline}\nAnswer:\nC"}]

In [11]:
# Multiple-choice vignette: lung autopsy findings in a 58-year-old after femur surgery.
# The prompt ends with "Answer:" and a newline, so generation continues right after it.
# NOTE(review): `response3` holds the prompt text (not a model response) and its
# result is stored as `med_output4`; both names are kept unchanged here.
response3 = (
    "Answer the question using the context below.\n"
    "Context: A pulmonary autopsy specimen from a 58-year-old woman who died of acute hypoxic respiratory failure was examined. She had recently undergone surgery for a fractured femur 3 months ago. Initial hospital course was uncomplicated, and she was discharged to a rehab facility in good health. Shortly after discharge home from rehab, she developed sudden shortness of breath and had cardiac arrest. Resuscitation was unsuccessful. On histological examination of lung tissue, fibrous connective tissue around the lumen of the pulmonary artery is observed.\n"
    "Question: Which of the following is the most likely pathogenesis for the present findings? Options: {A: Thromboembolism, B: Pulmonary ischemia, C: Pulmonary hypertension, D: Pulmonary passive congestion, E: Pulmonary hemorrhage}\n"
    "Answer:\n"
)

# Run the prompt through the medical pipeline and display the raw result.
med_output4 = med_pipeline(response3)
med_output4

[{'generated_text': 'Answer the question using the context below.\nContext: A pulmonary autopsy specimen from a 58-year-old woman who died of acute hypoxic respiratory failure was examined. She had recently undergone surgery for a fractured femur 3 months ago. Initial hospital course was uncomplicated, and she was discharged to a rehab facility in good health. Shortly after discharge home from rehab, she developed sudden shortness of breath and had cardiac arrest. Resuscitation was unsuccessful. On histological examination of lung tissue, fibrous connective tissue around the lumen of the pulmonary artery is observed.\nQuestion: Which of the following is the most likely pathogenesis for the present findings? Options: {A: Thromboembolism, B: Pulmonary ischemia, C: Pulmonary hypertension, D: Pulmonary passive congestion, E: Pulmonary hemorrhage}\nAnswer:\nA'}]

In [12]:
# Multiple-choice vignette: 20-year-old with long-standing menorrhagia and easy bruising.
# The prompt ends with "Answer:" and a newline, so generation continues right after it.
# NOTE(review): `response4` holds the prompt text (not a model response) and its
# result is stored as `med_output5`; both names are kept unchanged here.
response4 = (
    "Answer the question using the context below.\n"
    "Context: A 20-year-old woman presents with menorrhagia for the past several years. She says that her menses “have always been heavy”, and she has experienced easy bruising for as long as she can remember. Family history is significant for her mother, who had similar problems with bruising easily. The patient's vital signs include: heart rate 98/min, respiratory rate 14/min, temperature 36.1°C (96.9°F), and blood pressure 110/87 mm Hg. Physical examination is unremarkable. Laboratory tests show the following: platelet count 200,000/mm3, PT 12 seconds, and PTT 43 seconds.\n"
    "Question: Which of the following is the most likely cause of this patient’s symptoms? Options: {A: Factor V Leiden, B: Hemophilia A, C: Lupus anticoagulant, D: Protein C deficiency, E: Von Willebrand disease}\n"
    "Answer:\n"
)

# Run the prompt through the medical pipeline and display the raw result.
med_output5 = med_pipeline(response4)
med_output5

[{'generated_text': "Answer the question using the context below.\nContext: A 20-year-old woman presents with menorrhagia for the past several years. She says that her menses “have always been heavy”, and she has experienced easy bruising for as long as she can remember. Family history is significant for her mother, who had similar problems with bruising easily. The patient's vital signs include: heart rate 98/min, respiratory rate 14/min, temperature 36.1°C (96.9°F), and blood pressure 110/87 mm Hg. Physical examination is unremarkable. Laboratory tests show the following: platelet count 200,000/mm3, PT 12 seconds, and PTT 43 seconds.\nQuestion: Which of the following is the most likely cause of this patient’s symptoms? Options: {A: Factor V Leiden, B: Hemophilia A, C: Lupus anticoagulant, D: Protein C deficiency, E: Von Willebrand disease}\nAnswer:\nE"}]

In [13]:
# Multiple-choice vignette: 40-year-old zookeeper whose abdominal CT shows acute pancreatitis.
# The prompt ends with "Answer:" and a newline, so generation continues right after it.
# NOTE(review): `response5` holds the prompt text (not a model response) and its
# result is stored as `med_output6`; both names are kept unchanged here.
response5 = (
    "Answer the question using the context below.\n"
    "Context: A 40-year-old zookeeper presents to the emergency department complaining of severe abdominal pain that radiates to her back, and nausea. The pain started 2 days ago and slowly increased until she could not tolerate it any longer. Past medical history is significant for hypertension and hypothyroidism. Additionally, she reports that she was recently stung by one of the zoo’s smaller scorpions, but did not seek medical treatment. She takes aspirin, levothyroxine, oral contraceptive pills, and a multivitamin daily. Family history is noncontributory. Today, her blood pressure is 108/58 mm Hg, heart rate is 99/min, respiratory rate is 21/min, and temperature is 37.0°C (98.6°F). On physical exam, she is a well-developed, obese female that looks unwell. Her heart has a regular rate and rhythm. Radial pulses are weak but symmetric. Her lungs are clear to auscultation bilaterally. Her lateral left ankle is swollen, erythematous, and painful to palpate. An abdominal CT is consistent with acute pancreatitis.\n"
    "Question: Which of the following is the most likely etiology for this patient’s disease? Options: {A: Aspirin, B: Oral contraceptive pills, C: Scorpion sting, D: Hypothyroidism, E: Obesity}\n"
    "Answer:\n"
)

# Run the prompt through the medical pipeline and display the raw result.
med_output6 = med_pipeline(response5)
med_output6

[{'generated_text': 'Answer the question using the context below.\nContext: A 40-year-old zookeeper presents to the emergency department complaining of severe abdominal pain that radiates to her back, and nausea. The pain started 2 days ago and slowly increased until she could not tolerate it any longer. Past medical history is significant for hypertension and hypothyroidism. Additionally, she reports that she was recently stung by one of the zoo’s smaller scorpions, but did not seek medical treatment. She takes aspirin, levothyroxine, oral contraceptive pills, and a multivitamin daily. Family history is noncontributory. Today, her blood pressure is 108/58 mm Hg, heart rate is 99/min, respiratory rate is 21/min, and temperature is 37.0°C (98.6°F). On physical exam, she is a well-developed, obese female that looks unwell. Her heart has a regular rate and rhythm. Radial pulses are weak but symmetric. Her lungs are clear to auscultation bilaterally. Her lateral left ankle is swollen, eryt