<a href="https://colab.research.google.com/github/folukeOpenuni/AI-Python/blob/master/covidResearch.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [1]:
!pip install requests beautifulsoup4 biopython


Collecting biopython
  Downloading biopython-1.83-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (3.1 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m3.1/3.1 MB[0m [31m31.5 MB/s[0m eta [36m0:00:00[0m
Installing collected packages: biopython
Successfully installed biopython-1.83


In [2]:
import requests
from bs4 import BeautifulSoup
from Bio import Entrez, Medline
import pandas as pd

In [5]:
Entrez.email = "folukeagbede@hotmail.com"

def search_pubmed(query, max_results=100):
    handle = Entrez.esearch(db="pubmed", term=query, retmax=max_results)
    record = Entrez.read(handle)
    handle.close()
    return record['IdList']

def fetch_details(id_list):
    ids = ",".join(id_list)
    handle = Entrez.efetch(db="pubmed", id=ids, rettype="medline", retmode="text")
    records = handle.read()
    handle.close()
    return records

def parse_medline(details):
    records = Medline.parse(details.splitlines())
    articles = []
    for record in records:
        article = {
            'Title': record.get('TI', ''),
            'Abstract': record.get('AB', ''),
            'DOI': record.get('LID', '').split()[0] if 'LID' in record else '',
            'Authors': ', '.join(record.get('AU', []))
        }
        articles.append(article)
    return articles

query = "SARS-CoV-2"
ids = search_pubmed(query)
details = fetch_details(ids)
articles = parse_medline(details)

# Convert list of articles to DataFrame
df = pd.DataFrame(articles)
print(df)


                                                Title  \
0   Efficient signal sequence of mRNA vaccines enh...   
1   Diverse roles of SARS-CoV-2 Spike and Nucleoca...   
2   Vertical transmission of SARS-CoV-2 delta-vari...   
3   Management of immunosuppression in lung transp...   
4   Neutralizing antibody responses and cellular r...   
..                                                ...   
95  Diabetes Following COVID-19 Infection: Is It C...   
96  Scleroderma Cardiac Crisis triggered by SARS-C...   
97  Long-term wastewater monitoring of SARS-CoV-2 ...   
98  Early, rapidly progressive vasculopathy in a t...   
99  Development of antibody levels and subsequent ...   

                                             Abstract  \
0   The signal sequence played a crucial role in t...   
1   BACKGROUND: The SARS-CoV-2 virus causes severe...   
2   BACKGROUND: As SARS-CoV-2 continues to be rele...   
3   BACKGROUND: The aim of this study was to asses...   
4   Although the mRNA SARS-CoV

In [6]:
df.head(10)

Unnamed: 0,Title,Abstract,DOI,Authors
0,Efficient signal sequence of mRNA vaccines enh...,The signal sequence played a crucial role in t...,10.1186/s12951-024-02488-3,"Zhang Y, Zhai S, Huang H, Qin S, Sun M, Chen Y..."
1,Diverse roles of SARS-CoV-2 Spike and Nucleoca...,BACKGROUND: The SARS-CoV-2 virus causes severe...,10.1186/s12964-024-01665-z,"Ciszewski WM, Wozniak LA, Sobierajska K"
2,Vertical transmission of SARS-CoV-2 delta-vari...,BACKGROUND: As SARS-CoV-2 continues to be rele...,10.1186/s12879-024-09420-y,"Zia MTK, Kumar K, Gamma E, Shakeel F, Hanna I,..."
3,Management of immunosuppression in lung transp...,BACKGROUND: The aim of this study was to asses...,10.1186/s12879-024-09269-1,"Bes-Berlandier H, Coiffard B, Bermudez J, Dema..."
4,Neutralizing antibody responses and cellular r...,Although the mRNA SARS-CoV-2 vaccine has impro...,10.1038/s41598-024-63147-z,"Kawashiro K, Suzuki R, Nogimori T, Tsujino S, ..."
5,SARS-CoV-2 detection in pediatric dental clini...,This was the first longitudinal study to analy...,10.1038/s41598-024-63020-z,"Kanamori D, Sakai J, Iijima T, Oono Y, Malla B..."
6,PMMA dialyzers modulate both humoral and cell-...,Patients on hemodialysis (HD) have a high risk...,10.1038/s41598-024-62044-9,"Castellano G, Netti GS, Cantaluppi V, Losappio..."
7,A comprehensive analysis of COVID-19 nonlinear...,This research conducts a detailed analysis of ...,10.1038/s41598-024-61730-y,"Riaz M, Shah K, Abdeljawad T, Amacha I, Al-Jas..."
8,SARS-CoV-2-specific immune responses converge ...,"Healthy individuals with hybrid immunity, due ...",10.1038/s41541-024-00886-0,"Aguilar-Bretones M, den Hartog Y, van Dijk LLA..."
9,Vaccination status and self-reported side effe...,The recent SARS-CoV-2 pandemic and the vaccina...,10.1038/s41598-024-62541-x,"Burian K, Heidler F, Frahm N, Hecker M, Langho..."
