In [1]:
# Import necessaeries libraries
import requests
from bs4 import BeautifulSoup
import pandas as pd

In [2]:
# Define the base URL and headers
base_url = "https://genzmarketing.xyz/"
headers = {"User-Agent": "Mozilla/5.0"}

In [3]:
# Fetch the main page content
response = requests.get(base_url, headers=headers)
if response.status_code == 200:
    soup = BeautifulSoup(response.text, 'html.parser')
else:
    print(f"Failed to fetch the website: {response.status_code}")
    exit()

In [4]:
# Extract links to articles/pages
articles = []
for link in soup.find_all('a', href=True):
    url = link['href']
    if url.startswith('/'): 
        url = base_url + url.lstrip('/')
    if base_url in url:
        articles.append(url)

In [5]:
# Extract content from each article
data = []
for article_url in set(articles):  # For Avoid duplicates
    try:
        article_response = requests.get(article_url, headers=headers)
        if article_response.status_code == 200:
            article_soup = BeautifulSoup(article_response.text, 'html.parser')
            title = article_soup.title.string if article_soup.title else "No Title"
            content = " ".join(p.text for p in article_soup.find_all('p'))  # Extract paragraphs
            data.append({"title": title, "url": article_url, "content": content})
    except Exception as e:
        print(f"Error fetching {article_url}: {e}")

In [6]:
# Save to CSV
df = pd.DataFrame(data)
df.to_csv('genzmarketing_data.csv', index=False)
print("Data scraping complete. Saved as genzmarketing_data.csv.")

Data scraping complete. Saved as genzmarketing_data.csv.


In [7]:
# Check CSV file
data = pd.read_csv("genzmarketing_data.csv")
# print(data)
data.head(5)


Unnamed: 0,title,url,content
0,The Neurodivergent Business Consortium (NB...,https://genzmarketing.xyz/blog/the-neurodiverg...,Loading... I was a very odd child to many peop...
1,,https://genzmarketing.xyz/service-CT,Loading... We know training and specific subje...
2,Cold Email Marketing| Portfolio\r\n,https://genzmarketing.xyz/portfolio/category/e...,Loading... Why is cold email marketing servic...
3,Video Advertisement| Portfolio\r\n,https://genzmarketing.xyz/portfolio/category/e...,Loading... Theme-based Video Advertisement F...
4,How Lead Generation Works? ( GenZMarketing...,https://genzmarketing.xyz/blog/how-lead-genera...,Loading... Lead generation is the process of a...
