# Playwright setup 

Set up a standard headless Playwright browser with the stealth plug-in, navigate to a page, and save its HTML to disk.

First let's import the needed packages.

In [2]:
import os
import asyncio
from playwright.async_api import async_playwright
from playwright_stealth import stealth_async

# Jupyter already runs an asyncio event loop; patching asyncio with nest_asyncio
# allows asyncio.run() to be called from notebook cells without raising
# "asyncio.run() cannot be called from a running event loop".
import nest_asyncio
nest_asyncio.apply()

## Set up a browser and navigate to a page

Below is a function that uses Playwright to open a browser and navigate to a page. It then saves the page's HTML to the data folder. Note that the first time you run this notebook, Playwright may ask you to install its browsers (run `playwright install` in a terminal).

In [4]:
# Base name (without extension) of the HTML file that scrape_all() writes.
page_name = "google"
# Folder that receives the saved page; scrape_all() resolves it as "../<data_folder>",
# i.e. relative to the parent of the current working directory.
data_folder = "data"

async def scrape_all(headless=True):
    """Open https://google.nl in Firefox via Playwright and save its HTML to disk.

    The page is loaded in a fresh browser context with the stealth plug-in
    applied, and the resulting markup is written to
    ``../<data_folder>/<page_name>.html`` (both names are module-level
    variables), encoded as UTF-8.

    Args:
        headless: Passed to ``firefox.launch``; set to ``False`` to watch the
            browser window while the page loads.

    Raises:
        OSError: If the output folder cannot be created or the file cannot be
            written.
        Exception: Any Playwright error raised while launching the browser or
            loading the page is propagated after the browser has been closed.
    """
    # Resolve the output path and create its folder *before* launching the
    # browser, so a missing or unwritable folder fails fast instead of after
    # the whole scrape has already run.
    file_name = f"../{data_folder}/{page_name}.html"
    os.makedirs(os.path.dirname(file_name), exist_ok=True)

    async with async_playwright() as p:
        browser = await p.firefox.launch(headless=headless)
        try:
            context = await browser.new_context()
            page = await context.new_page()
            await stealth_async(page)

            await page.goto("https://google.nl")
            # Fixed 3 s pause before taking the snapshot — presumably to let
            # late-loading scripts finish rendering the page.
            await page.wait_for_timeout(3000)

            html_content = await page.content()
        finally:
            # Close the browser even when navigation or capture fails.
            await browser.close()

    with open(file_name, 'w', encoding='utf-8') as file:
        file.write(html_content)

# Run the scraper to completion. Calling asyncio.run() from a notebook cell relies on
# the nest_asyncio.apply() patch made in the imports cell. Running this cell launches
# a browser, hits the network and overwrites the saved HTML file.
asyncio.run(scrape_all(headless=True))