In [87]:
from urllib.parse import urljoin

from bs4 import BeautifulSoup
import requests
import pandas as pd
import numpy as np

In [95]:
# Function to extract Product Title
def get_title(soup):
    """Return the product title found in the parsed page.

    Looks up the first ``<p class="legende">`` element and returns its text
    with surrounding whitespace removed.

    Args:
        soup: Parsed page object exposing a BeautifulSoup-style ``find``.

    Returns:
        The stripped title text, or ``""`` when the lookup raises
        ``AttributeError`` (for example because no matching element exists
        and ``find`` returned ``None``).
    """
    try:
        heading = soup.find("p", attrs={"class": 'legende'})
        # `.text` on None raises AttributeError, handled below.
        return heading.text.strip()
    except AttributeError:
        return ""

# Function to extract Product Price
def get_price(soup):
    """Return the product price text found in the parsed page.

    Two ``<span>`` selectors are tried in order: the regular price element
    (matched on its full ``class`` string) and, as a fallback, the element
    with id ``priceblock_dealprice``. The first one that yields a string is
    returned with surrounding whitespace removed.

    Args:
        soup: Parsed page object exposing a BeautifulSoup-style ``find``.

    Returns:
        The stripped price text, or ``""`` when neither selector yields a
        string.
    """
    # NOTE(review): the fallback id looks carried over from another site's
    # markup -- confirm it actually occurs on the pages being scraped.
    candidate_attrs = (
        {'class': 'dyn_prod_price product__price--new'},
        {'id': 'priceblock_dealprice'},
    )

    for attrs in candidate_attrs:
        try:
            # A missing element (find -> None) or a missing `.string`
            # raises AttributeError, which moves on to the next selector.
            return soup.find("span", attrs=attrs).string.strip()
        except AttributeError:
            # Only "not found" is treated as recoverable; anything else
            # (including KeyboardInterrupt) propagates instead of being
            # silently swallowed by a bare `except`.
            continue

    return ""


# Function to extract Number of User Reviews
def get_review_count(soup):
    """Return the review-count text found in the parsed page.

    Reads the string of the first ``<a href="#com">`` element and strips
    surrounding whitespace.

    Args:
        soup: Parsed page object exposing a BeautifulSoup-style ``find``.

    Returns:
        The stripped anchor string, or ``""`` when the lookup raises
        ``AttributeError`` (no such anchor, or the anchor has no ``.string``).
    """
    try:
        anchor = soup.find("a", attrs={'href': '#com'})
        return anchor.string.strip()
    except AttributeError:
        return ""

# Function to extract Availability Status
def get_availability(soup):
    """Return the availability text found in the parsed page.

    Finds the stock ``<p>`` element (matched on its full ``class`` string),
    then reads the string of the first ``<span>`` inside it and strips
    surrounding whitespace.

    Args:
        soup: Parsed page object exposing a BeautifulSoup-style ``find``.

    Returns:
        The stripped span string, or ``"Not Available"`` when any step of
        the lookup raises ``AttributeError`` (missing paragraph, missing
        span, or a span without ``.string``).
    """
    stock_attrs = {'class': 'dyn_prod_avaibility product__stock product__stock--stock'}
    try:
        stock_paragraph = soup.find("p", attrs=stock_attrs)
        return stock_paragraph.find("span").string.strip()
    except AttributeError:
        return "Not Available"



In [97]:

if __name__ == '__main__':
    # Scrape the listing page, visit every linked product page, collect the
    # extracted fields into a DataFrame and write it to a CSV file.

    # Browser-like request headers; replace the User-Agent with your own.
    HEADERS = ({'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/114.0.0.0 Safari/537.36', 'Accept-Language': 'en-US, en;q=0.5'})

    # The listing page whose product links are crawled
    URL = "https://www.rueducommerce.fr/r/telephones.html"

    # Seconds before a request is abandoned; without a timeout requests
    # can block indefinitely on an unresponsive server.
    REQUEST_TIMEOUT = 30

    # Fetch the listing page and fail loudly on an HTTP error instead of
    # silently parsing an error page and writing an empty CSV.
    webpage = requests.get(URL, headers=HEADERS, timeout=REQUEST_TIMEOUT)
    webpage.raise_for_status()

    # Soup object containing the listing page
    soup = BeautifulSoup(webpage.content, "html.parser")

    # Product links as a list of Tag objects
    links = soup.find_all("a", attrs={'class':'item__image'})

    # Keep only anchors that actually carry an href; a missing href would
    # otherwise be None and break URL construction below.
    links_list = [link.get('href') for link in links if link.get('href')]

    d = {"title":[], "price":[], "rating":[], "reviews":[],"availability":[]}

    # Extract product details from each linked product page
    for link in links_list:
        # urljoin resolves site-relative hrefs against the listing URL and
        # leaves already-absolute hrefs untouched.
        product_url = urljoin(URL, link)

        try:
            new_webpage = requests.get(product_url, headers=HEADERS, timeout=REQUEST_TIMEOUT)
            new_webpage.raise_for_status()
        except requests.RequestException as exc:
            # One unreachable product page should not abort the whole crawl.
            print(f"Skipping {product_url}: {exc}")
            continue

        new_soup = BeautifulSoup(new_webpage.content, "html.parser")

        # NOTE(review): get_rating is not defined in any cell shown in this
        # notebook; it must be defined before this cell runs, otherwise the
        # call below raises NameError on a fresh kernel.
        d['title'].append(get_title(new_soup))
        d['price'].append(get_price(new_soup))
        d['rating'].append(get_rating(new_soup))
        d['reviews'].append(get_review_count(new_soup))
        d['availability'].append(get_availability(new_soup))

    rueducommerce = pd.DataFrame.from_dict(d)
    # Assign the result back instead of calling replace(..., inplace=True)
    # on a column selection: the chained in-place form warns on pandas 2.x
    # and does not modify the frame under Copy-on-Write.
    rueducommerce['title'] = rueducommerce['title'].replace('', np.nan)
    # Rows without a title are treated as failed extractions and dropped.
    rueducommerce = rueducommerce.dropna(subset=['title'])
    rueducommerce.to_csv("rueducommerce_data.csv", header=True, index=False)


In [94]:
# Debug inspection: display the parsed HTML currently bound to new_soup
# (assigned inside the product-page loop of the scraping cell).
new_soup

<!DOCTYPE html>

<html id="rdc" lang="fr">
<head>
<title>Fisher Price - LE TELEPHONE ANIME - FGW66 - Jeux d'éveil - Rue du Commerce</title>
<meta charset="utf-8"/>
<meta content="Achetez votre Fisher Price LE TELEPHONE ANIME - FGW66 et retrouvez toute la selection de Jeux d'éveil Fisher Price sur Rue du Commerce au meilleur prix." name="description"/>
<meta content="width=device-width, initial-scale=1, user-scalable=0" name="viewport"/>
<meta content="Rue du commerce, hightech, high-tech, ordinateur, maison connectee, objet connecte, informatique, gaming, telephone, meubles, petit electromenager, jardin, pack location, pack revente" name="keywords"/>
<meta content="max-image-preview:large" name="robots"/>
<meta content="PQQOAbxOqmKoz0GP_75unXw0PPo7eD39WzxkAcj-4w0" name="google-site-verification">
<meta content="ycaWidt1t6sfnwRYevEg41yKv2LP3D6V6RJBpEiEDiU" name="google-site-verification">
<meta content="Achetez votre Fisher Price LE TELEPHONE ANIME - FGW66 et retrouvez toute la selectio

In [96]:
# Spot-check the title extractor against the page currently bound to new_soup.
get_title(new_soup)

'LE TELEPHONE ANIME - FGW66'

In [98]:
# Display the DataFrame built by the scraping cell.
rueducommerce

Unnamed: 0,title,price,rating,reviews,availability
0,Sony Xperia Z2 - Qualcomm snapdragon - 16 Go -...,24890.0,,39 Avis,Not Available
1,Crosscall Crosscall Core-X5,44032.0,,,Not Available
2,SAMSUNG Smartphone Galaxy S22 5G Noir EE 8 Go ...,,,,Not Available
3,doro - téléphone duo sans fil mains-libres dec...,5489.0,,,Not Available
4,DESIGNATION REF PHILIPS42,11191.0,,,Not Available
5,DESIGNATION REF PHILIPS43,10502.0,,,Not Available
6,3S 850VA 510W ONDULEUR OFF,,,,Not Available
7,Téléphone sans fil Senior Doro PhoneEasy® 100w...,6179.0,,,Not Available
8,Prise parafoudre 8 prises + Protection Vidéo +...,,,,Not Available
9,Adaptateur USB WiFi bi-bande AC 600 Mbps à gai...,,,,Not Available
