In [1]:
import pandas as pd
from bs4 import BeautifulSoup
import requests

def scrape_healthline(url, index, timeout=30):
    """Download one Healthline article page and extract its key fields.

    Parameters
    ----------
    url : str
        Address of the article page. Stored unchanged under ``'Link'``.
    index : int
        Caller-supplied row number. Stored unchanged under ``'Index'``.
    timeout : float or tuple, optional
        Forwarded to ``requests.get``. Without a timeout a stalled server
        would block the call indefinitely. Defaults to 30 seconds.

    Returns
    -------
    dict
        Keys ``'Index'``, ``'Title'``, ``'Link'``, ``'Image URL'``,
        ``'Content'``, ``'HTML Content'`` and ``'Date Fetched'``. A field
        whose page element cannot be located is ``None``.

    Raises
    ------
    requests.exceptions.RequestException
        If the request fails or exceeds ``timeout``.
    """
    response = requests.get(url, timeout=timeout)
    # HTTP error statuses are not raised here: an error page is parsed like
    # any other and simply yields None for the fields it does not contain.
    soup = BeautifulSoup(response.content, 'lxml')

    # NOTE(review): the class names below look auto-generated by the site's
    # CSS tooling and may change without notice; every lookup therefore
    # degrades to None instead of raising.
    title_wrapper = soup.find('div', class_='css-z468a2')
    heading = title_wrapper.h1 if title_wrapper is not None else None
    title = heading.text if heading is not None else None

    picture = soup.find('picture', class_='css-16pk1is')
    img_tag = picture.img if picture is not None else None
    img_src = img_tag.get('src') if img_tag is not None else None
    # Drop only a protocol-relative "//" prefix; an src that is already
    # absolute (e.g. "https://...") is kept intact rather than truncated.
    if img_src and img_src.startswith('//'):
        img_src = img_src[2:]

    article = soup.find('article', class_='article-body css-d2znx6 undefined')
    content = article.text if article is not None else None
    # Keep a real None for a missing article instead of the string 'None',
    # so pandas treats it as a missing value like the other fields.
    html_content = str(article) if article is not None else None

    return {
        'Index': index,
        'Title': title,
        'Link': url,
        'Image URL': img_src,
        'Content': content,
        'HTML Content': html_content,
        'Date Fetched': pd.to_datetime('today').strftime('%Y-%m-%d')
    }

# Healthline articles to scrape, in the order their rows should appear.
urls = [
    'https://www.healthline.com/health/developmental-delay',
    'https://www.healthline.com/health/autism',
    'https://www.healthline.com/health/autism/signs-of-autism-in-babies?utm_source=ReadNext',
    'https://www.healthline.com/health/types-of-autism?utm_source=ReadNext',
    'https://www.healthline.com/health/aspergers-vs-autism',
    'https://www.healthline.com/health/autism/how-to-eat-if-youre-autistic?utm_source=ReadNext',
    'https://www.healthline.com/health/autism/is-autism-a-disability?utm_source=ReadNext',
    'https://www.healthline.com/health/autism/autism-misdiagnosis?utm_source=ReadNext',
    'https://www.healthline.com/health/autism-treatment?utm_source=ReadNext',
    'https://www.healthline.com/health-news/does-screen-time-cause-developmental-delays-in-young-children',
    'https://www.healthline.com/health/childrens-health/stages-of-child-development',
    'https://www.healthline.com/health/adhd/parenting-tips',
    'https://www.healthline.com/health/adhd/is-adhd-a-disability',
    'https://www.healthline.com/health/adhd/who-diagnoses-adhd#who-can-diagnose',
    'https://www.healthline.com/health/down-syndrome',
]

# Column order of the resulting table; matches the keys of each scraped record.
COLUMNS = [
    'Index',
    'Title',
    'Link',
    'Image URL',
    'Content',
    'HTML Content',
    'Date Fetched',
]

# One record per URL, numbered from 1 in list order.
data = [
    scrape_healthline(page_url, position)
    for position, page_url in enumerate(urls, start=1)
]

df = pd.DataFrame(data, columns=COLUMNS)
print(df)

    Index                                              Title  \
0       1    What You Need to Know About Developmental Delay   
1       2  Everything You Need to Know About Autism Spect...   
2       3  Signs of Autism in Babies: A Simple Guide to D...   
3       4               Are There Different Types of Autism?   
4       5  What’s the Difference Between Asperger’s and A...   
5       6              Your Guide to Eating Well with Autism   
6       7                 Is Autism Considered a Disability?   
7       8                 How Common Is Autism Misdiagnosis?   
8       9                             Autism Treatment Guide   
9      10  Excessive Screen Time for Kids Can Cause Devel...   
10     11  Ages and Stages: How to Monitor Child Development   
11     12           Parenting Tips for ADHD: Do’s and Don’ts   
12     13                          ADHD: Is It a Disability?   
13     14                                Who Diagnoses ADHD?   
14     15                               

In [2]:
# Write the scraped table to HealthLine.csv in the working directory.
# index=False leaves out the DataFrame's row labels, so only the seven
# named columns (including the frame's own 'Index' column) are written.
df.to_csv(path_or_buf='HealthLine.csv', index=False)