In [61]:
# 1. Extract Text Data:

import requests 
from bs4 import BeautifulSoup 
import csv 

# Fetch the page and export its headings, paragraphs and list items to a CSV
# file with two columns: the tag name ("type") and its stripped text ("content").
url = "https://www.baraasallout.com/test.html"
# requests applies no timeout unless one is passed, so without this argument a
# stalled connection would block the cell forever. A timeout raises
# requests.exceptions.Timeout instead.
response = requests.get(url, timeout=10)
if response.status_code == 200:
    soup = BeautifulSoup(response.text, "html.parser")

    headings = soup.find_all(['h1', 'h2'])
    paragraphs = soup.find_all('p')
    list_items = soup.find_all('li')

    # Rows are grouped by kind (headings, then paragraphs, then list items)
    # rather than interleaved in document order.
    text_data = [
        {"type": tag.name, "content": tag.get_text(strip=True)}
        for group in (headings, paragraphs, list_items)
        for tag in group
    ]

    # newline="" hands line-ending control to the csv module, which avoids
    # blank lines between rows on Windows.
    with open("Extract_Text_Data.csv", mode="w", newline="", encoding="utf-8") as csv_file:
        writer = csv.DictWriter(csv_file, fieldnames=["type", "content"])
        writer.writeheader()
        writer.writerows(text_data)

    print("Text data has been extracted and saved to the file: Extract_Text_Data.csv")
else:
    print("Failed to fetch the page. Status code:", response.status_code)


Text data has been extracted and saved to the file: Extract_Text_Data.csv


In [74]:
#2. Extract Table Data:
import requests
from bs4 import BeautifulSoup 
import csv 

# Fetch the page and export the first <table> it contains to a CSV file whose
# columns are the texts of the table's <th> cells.
url = "https://www.baraasallout.com/test.html"

# Explicit timeout: requests waits indefinitely by default, which would hang
# the cell on a stalled connection.
response = requests.get(url, timeout=10)
if response.status_code == 200:
    soup = BeautifulSoup(response.text, "html.parser")

    # Only the first <table> in the document is processed.
    table = soup.find("table")

    if table:
        headers = [header.get_text(strip=True) for header in table.find_all("th")]

        rows = []
        # The first <tr> is treated as the header row and skipped.
        for row in table.find_all("tr")[1:]:
            columns = [col.get_text(strip=True) for col in row.find_all("td")]
            if not columns:
                # A row without any <td> cells would become an empty dict and
                # be written as a blank CSV line, so it is dropped.
                continue
            # zip pairs cells with headers by position; cells beyond the
            # number of headers are discarded, and missing cells are left
            # blank by DictWriter.
            rows.append(dict(zip(headers, columns)))

        with open("Extract_Table_Data.csv", mode="w", newline="", encoding="utf-8") as csv_file:
            writer = csv.DictWriter(csv_file, fieldnames=headers)
            writer.writeheader()
            writer.writerows(rows)

        print("Table data has been extracted and saved to the file: Extract_Table_Data.csv")
    else:
        print("No table found in the page.")
else:
    print("Failed to fetch the page. Status code:", response.status_code)


Table data has been extracted and saved to the file: Extract_Table_Data.csv


In [76]:
#3. Extract Product Information (Cards Section):
import requests
from bs4 import BeautifulSoup
import json

# Fetch the page and export one JSON record per element with class "book-card":
# title, price, stock status and the text of its button.
url = "https://www.baraasallout.com/test.html"
# Explicit timeout: requests waits indefinitely by default, which would hang
# the cell on a stalled connection.
response = requests.get(url, timeout=10)
if response.status_code == 200:
    soup = BeautifulSoup(response.text, "html.parser")

    cards = soup.find_all(class_="book-card")

    # Output key -> keyword arguments for card.find(). Keeping the lookups in
    # one table means each element is searched for once per card instead of
    # once to test for presence and again to read its text.
    field_lookups = (
        ("Book Title", {"class_": "title"}),
        ("Price", {"class_": "price"}),
        ("Stock Availability", {"class_": "stock-status"}),
        ("Button Text", {"name": "button"}),
    )

    product_info = []
    for card in cards:
        record = {}
        for label, criteria in field_lookups:
            node = card.find(**criteria)
            # find() returns None when nothing matches; fall back to "N/A".
            record[label] = node.get_text(strip=True) if node is not None else "N/A"
        product_info.append(record)

    with open("Product_Information.json", mode="w", encoding="utf-8") as json_file:
        json.dump(product_info, json_file, indent=4)

    print("The data has been extracted and saved to the file: Product_Information.json")
else:
    print("Failed to load the page.")


The data has been extracted and saved to the file: Product_Information.json


In [78]:
#4. Extract Form Details:
import requests
from bs4 import BeautifulSoup
import json

# Fetch the page and export, for every <input> inside every <form>, its name,
# type and default value as a JSON list.
url = "https://www.baraasallout.com/test.html"
# Explicit timeout: requests waits indefinitely by default, which would hang
# the cell on a stalled connection.
response = requests.get(url, timeout=10)

if response.status_code == 200:
    soup = BeautifulSoup(response.text, "html.parser")
    forms = soup.find_all("form")

    # Only <input> elements are collected; an attribute that is absent on the
    # tag is reported as "N/A".
    form_details = [
        {
            "Field Name": input_tag.get("name", "N/A"),
            "Input Type": input_tag.get("type", "N/A"),
            "Default Value": input_tag.get("value", "N/A"),
        }
        for form in forms
        for input_tag in form.find_all("input")
    ]

    with open("Form_Details.json", "w", encoding="utf-8") as json_file:
        json.dump(form_details, json_file, indent=4)

    print("Form details have been extracted and saved to the file: Form_Details.json")
else:
    print("Failed to load the page.")


Form details have been extracted and saved to the file: Form_Details.json


In [80]:
#5. Extract Links and Multimedia:
import requests
from bs4 import BeautifulSoup
import json

# Fetch the page and export every <a> (text + href) and every <iframe> (src)
# to a single JSON document with the keys "links" and "videos".
url = "https://www.baraasallout.com/test.html"
# Explicit timeout: requests waits indefinitely by default, which would hang
# the cell on a stalled connection.
response = requests.get(url, timeout=10)
if response.status_code == 200:
    soup = BeautifulSoup(response.text, "html.parser")

    # href/src values are stored exactly as written in the markup (relative
    # URLs are not resolved); a missing attribute is reported as "N/A".
    links = [
        {"link_text": a.get_text(strip=True), "href": a.get("href", "N/A")}
        for a in soup.find_all("a")
    ]

    iframes = [
        {"video_url": iframe.get("src", "N/A")}
        for iframe in soup.find_all("iframe")
    ]

    data = {"links": links, "videos": iframes}

    with open("Links_and_Multimedia.json", "w", encoding="utf-8") as json_file:
        json.dump(data, json_file, indent=4)

    print("Links and multimedia content have been extracted and saved to the file: Links_and_Multimedia.json")
else:
    print("Failed to load the page.")


Links and multimedia content have been extracted and saved to the file: Links_and_Multimedia.json


In [82]:
import requests
from bs4 import BeautifulSoup
import json

# Extract Featured Products:
# Fetch the page and export one JSON record (id, name, price, colors) per
# ".product-card" element found inside a ".featured-products" container.
url = "https://www.baraasallout.com/test.html"
# Explicit timeout: requests waits indefinitely by default, which would hang
# the cell on a stalled connection.
response = requests.get(url, timeout=10)

if response.status_code == 200:
    soup = BeautifulSoup(response.text, "html.parser")

    # NOTE(review): confirm this selector against the page markup. If it
    # matches nothing, the cell still reports success and writes an empty list.
    products = soup.select(".featured-products .product-card")

    featured_products = []
    for product in products:
        name_tag = product.find("span", class_="name")
        # The price span is matched on its exact inline style string, so any
        # difference in spacing inside the attribute makes this return None.
        price_tag = product.find("span", class_="price", style="display: none;")
        colors_tag = product.find("span", class_="colors")

        # get_text() has no `default` parameter and find() returns None when
        # nothing matches, so the "N/A" fallback is applied explicitly here.
        featured_products.append({
            "id": product.get("data-id", "N/A"),
            "name": name_tag.get_text(strip=True) if name_tag is not None else "N/A",
            "price": price_tag.get_text(strip=True) if price_tag is not None else "N/A",
            "colors": colors_tag.get_text(strip=True) if colors_tag is not None else "N/A",
        })

    with open("Featured_Products.json", "w", encoding="utf-8") as json_file:
        json.dump(featured_products, json_file, indent=4)

    print("Data has been successfully extracted and saved to 'Featured_Products.json'.")
else:
    print("Failed to load the webpage.")


Data has been successfully extracted and saved to 'Featured_Products.json'.
