In [None]:
!pip install transformers




In [None]:
import torch
from transformers import BioGptTokenizer, BioGptForCausalLM, set_seed

# Checkpoint shared by the tokenizer and the causal language model.
MODEL_NAME = "microsoft/biogpt"
tokenizer = BioGptTokenizer.from_pretrained(MODEL_NAME)
model = BioGptForCausalLM.from_pretrained(MODEL_NAME)

# Prompt that the model is asked to continue, encoded as PyTorch tensors.
sentence = "Axial T1-weighted MRI scan of the brain showing a mass in the left frontal lobe."
inputs = tokenizer(sentence, return_tensors="pt")

set_seed(42)

# Generation settings gathered in one place so they are easy to read and tune.
generation_kwargs = {
    "min_length": 100,
    "max_length": 1024,
    "num_beams": 5,
    "early_stopping": True,
}

# Inference only: no gradients need to be tracked while generating.
with torch.no_grad():
    beam_output = model.generate(**inputs, **generation_kwargs)

# Decode the first returned sequence; as the cell's last expression it is
# what the notebook displays.
decoded_text = tokenizer.decode(beam_output[0], skip_special_tokens=True)
decoded_text

'Axial T1-weighted MRI scan of the brain showing a mass in the left frontal lobe., T2-weighted MRI scan showing a mass in the right frontal lobe, and contrast-enhanced T1-weighted MRI scan showing a mass in the left frontal lobe, were performed in order to evaluate the extent of the tumor and to determine the relationship between the tumor and the surrounding brain tissue, and the tumor was surgically removed by means of a left frontal craniotomy and partial removal of the tumor in the left frontal lobe.'

In [None]:
!pip install spacy
!python -m spacy download en_core_web_sm


Collecting en-core-web-sm==3.7.1
  Downloading https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.7.1/en_core_web_sm-3.7.1-py3-none-any.whl (12.8 MB)
     ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 12.8/12.8 MB 68.3 MB/s eta 0:00:00
✔ Download and installation successful
You can now load the package via spacy.load('en_core_web_sm')
⚠ Restart to reload dependencies
If you are in a Jupyter or Colab notebook, you may need to restart Python in
order to load all the package's dependencies. You can do this by selecting the
'Restart kernel' or 'Restart runtime' option.


In [None]:
import spacy

# Load spaCy's small English pipeline.
nlp = spacy.load("en_core_web_sm")

# The generated text (for demonstration, pasted from the model output).
# .strip() removes the newlines that the triple-quoted literal adds at both
# ends, so they cannot end up inside the first noun chunk.
generated_text = """
Axial T1-weighted MRI scan of the brain showing a mass in the left frontal lobe, T2-weighted MRI scan showing a mass in the right frontal lobe, and contrast-enhanced T1-weighted MRI scan showing a mass in the left frontal lobe, were performed in order to evaluate the extent of the tumor and to determine the relationship between the tumor and the surrounding brain tissue, and the tumor was surgically removed by means of a left frontal craniotomy and partial removal of the tumor in the left frontal lobe.
""".strip()

# Process the text with spaCy to identify key phrases and words.
doc = nlp(generated_text)

# Whitespace and punctuation trimmed from both ends of each noun chunk, so a
# chunk that comes back as ", T2-weighted MRI scan" becomes
# "T2-weighted MRI scan".
EDGE_CHARS = " \t\r\n,.;:"

# Extract noun phrases as keyword candidates, cleaned at the edges.
keywords = [chunk.text.strip(EDGE_CHARS) for chunk in doc.noun_chunks]

# dict.fromkeys removes duplicates while keeping first-appearance order, so
# the result is identical on every run (list(set(...)) is not, because string
# hashing is randomised per interpreter session). Chunks that are empty after
# trimming are dropped.
unique_keywords = [phrase for phrase in dict.fromkeys(keywords) if phrase]

print("Main Words and Phrases:", unique_keywords)


Main Words and Phrases: ['a left frontal craniotomy', ', T2-weighted MRI scan', 'contrast-enhanced T1-weighted MRI scan', 'the relationship', 'the right frontal lobe', 'the tumor', '\nAxial T1-weighted MRI scan', 'the extent', 'partial removal', 'means', 'a mass', 'the surrounding brain tissue', 'the brain', 'the left frontal lobe', 'order']
