In [1]:
import requests
from bs4 import BeautifulSoup

In [2]:
def scrape_url_content(url: str, timeout: float = 10) -> str:
    """
    Fetch a webpage and return its text, one text fragment per line.

    Args:
        url (str): The URL of the webpage to scrape.
        timeout (float): Timeout in seconds passed to ``requests.get``.
            Defaults to 10, the value that was previously hard-coded.

    Returns:
        str: The text extracted from the page's HTML, with surrounding
            whitespace stripped from each fragment and fragments joined by
            a newline character. If the request raises a
            ``requests.exceptions.RequestException`` (including the
            ``HTTPError`` raised for 4xx/5xx responses), a message of the
            form ``"An error occurred while fetching the URL: ..."`` is
            returned instead of raising; callers that need to tell success
            from failure must check for that prefix.
    """
    # Browser-like User-Agent; presumably here so that sites rejecting the
    # default python-requests agent still answer (not verifiable from this file).
    headers = {
        "User-Agent": (
            "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
            "(KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
        )
    }

    try:
        # Send a GET request to the URL with headers
        response = requests.get(url, headers=headers, timeout=timeout)
        response.raise_for_status()  # Raise an HTTPError for bad responses (4xx and 5xx)

        # Parse the HTML content using BeautifulSoup
        soup = BeautifulSoup(response.text, 'html.parser')

        # Join the text fragments with a real newline. The separator must be
        # '\n' (one newline character); '\\n' would insert a literal backslash
        # followed by "n" between fragments and leave the result on one line.
        content = soup.get_text(separator='\n', strip=True)

        return content

    except requests.exceptions.RequestException as e:
        return f"An error occurred while fetching the URL: {e}"


In [None]:
# Demo: scrape a forbes.com article and show the extracted text
# (or the error message the helper returns when the request fails).
url = (
    "https://www.forbes.com/sites/dereksaul/2025/01/28/deepseek-panic-live-updates-nvidia-stock-makes-history-again-with-260-billion-rebound/"
)
print(scrape_url_content(url))

In [None]:
# Demo: scrape a hopkinsmedicine.org page and show the extracted text
# (or the error message the helper returns when the request fails).
url = (
    "https://www.hopkinsmedicine.org/health/treatment-tests-and-therapies/back-spine-surgery"
)
print(scrape_url_content(url))

In [None]:
# Demo: scrape the root page of y-yin.io and show the extracted text
# (or the error message the helper returns when the request fails).
url = (
    "https://www.y-yin.io/"
)
print(scrape_url_content(url))