In [1]:
import os
import json
import boto3
import shutil
from bing_image_downloader import downloader
from tqdm import tqdm
import cv2

In [2]:
def download_images(actor, num_imgs, img_size):
    """Download images for ``actor`` and keep only the ones where a face is detected.

    The ``temp_imagens`` working directory is emptied first. The downloader
    is asked to write into ``temp_imagens/<actor>``; that folder is then renamed
    to the lower-case, underscore-separated form of the actor name, and every
    file for which ``has_face`` returns False is deleted.

    Args:
        actor: Search query; also the name of the folder the downloader fills.
        num_imgs: Maximum number of images requested from the downloader.
        img_size: Not used by this function; kept so existing callers still work.
    """
    output_dir = 'temp_imagens'
    # Start from a clean directory, but do not fail when it does not exist yet.
    if os.path.isdir(output_dir):
        shutil.rmtree(output_dir)
    actor_name_formatted = actor.lower().replace(' ', '_')

    downloader.download(actor, limit=num_imgs, output_dir=output_dir, adult_filter_off=True, force_replace=False, timeout=60)

    old_dir = os.path.join(output_dir, actor)
    new_dir = os.path.join(output_dir, actor_name_formatted)
    # Nothing to rename when the query is already in its formatted form.
    if old_dir != new_dir:
        os.rename(old_dir, new_dir)

    for img_name in os.listdir(new_dir):
        img_path = os.path.join(new_dir, img_name)

        # Drop the image when no face is detected in it.
        if not has_face(img_path):
            os.remove(img_path)
            print("Remove image: " + img_path)
        
        
def has_face(img_path):
    """Return True when at least one frontal face is detected in the image file.

    GIF files are rejected without being opened. Files that OpenCV cannot
    decode are treated as containing no face instead of raising.

    Args:
        img_path: Path of the image file to inspect.

    Returns:
        bool: True if the Haar cascade detector reports one or more faces.
    """
    if img_path.lower().endswith('.gif'):
        return False

    print(img_path)

    # cv2.imread signals an unreadable/unsupported file by returning None
    # rather than raising; passing None on to cvtColor would crash.
    image = cv2.imread(img_path)
    if image is None:
        return False

    # Haar cascade frontal-face detector shipped with OpenCV.
    face_cascade = cv2.CascadeClassifier(cv2.data.haarcascades + 'haarcascade_frontalface_default.xml')

    # The detector is run on a grayscale copy of the image.
    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)

    faces = face_cascade.detectMultiScale(gray, scaleFactor=1.1, minNeighbors=5, minSize=(30, 30))

    return len(faces) > 0

        
def upload_s3(actor):
    """Upload every regular file found in ``temp_imagens/<actor>`` to S3.

    Each file is stored in the ``seekinglost-dados-treino-raw`` bucket under
    the key ``<actor>/<file name>``. Entries that are not files are skipped.

    Args:
        actor: Name of the sub-folder of ``temp_imagens`` to upload; also used
            as the key prefix inside the bucket.
    """
    s3 = boto3.Session().client("s3")
    bucket_name = "seekinglost-dados-treino-raw"
    actor_path = f"temp_imagens/{actor}"

    for entry in tqdm(os.listdir(actor_path)):
        local_path = os.path.join(actor_path, entry)

        # Only plain files are uploaded.
        if not os.path.isfile(local_path):
            continue

        object_key = f"{actor}/{os.path.basename(local_path)}"
        s3.upload_file(local_path, bucket_name, object_key)
            
            
def main(list_actors, num_imgs, img_size):
    """Download and upload images for each actor, then remove the temp directory.

    For every name in ``list_actors`` the images are downloaded with
    ``download_images`` and the resulting folder (lower-case name with spaces
    replaced by underscores) is uploaded with ``upload_s3``.

    Args:
        list_actors: Iterable of actor names used as search queries.
        num_imgs: Maximum number of images to download per actor.
        img_size: Forwarded unchanged to ``download_images``.
    """
    os.makedirs('temp_imagens', exist_ok=True)

    try:
        for actor in list_actors:
            download_images(actor, num_imgs, img_size)
            actor_name_formatted = actor.lower().replace(' ', '_')
            upload_s3(actor_name_formatted)
    finally:
        # Clean up even when a download or upload fails; ignore_errors keeps a
        # cleanup problem from masking the original exception.
        shutil.rmtree('temp_imagens', ignore_errors=True)

In [7]:
if __name__ == '__main__':
    # The actor names are the keys of the JSON parameters file.
    with open('parameters_crawler.json', 'r') as file:
        actors = json.load(file)
    list_actors = [name for name in actors.keys()]
    del actors  # only the names are needed from here on

    # This parameter is ignored downstream but kept for consistency.
    img_size = "large"

    main(list_actors, 25, img_size)

[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/actors


[!!]Indexing page: 1

[%] Indexed 25 Images on Page 1.


[%] Downloading Image #1 from https://www.pouted.com/wp-content/uploads/2015/04/chris-pine.jpg?x45357
[%] File Downloaded !

[%] Downloading Image #2 from http://images6.fanpop.com/image/polls/1516000/1516348_1444854346844_full.jpg?v=1444854363
[%] File Downloaded !

[%] Downloading Image #3 from https://cf.girlsaskguys.com/q4042656/b7ef090d-144d-4c71-af26-4b44cd18260e.jpg
[%] File Downloaded !

[%] Downloading Image #4 from http://img-cdn.brainberries.co/wp-content/uploads/2016/03/british_actors_currently_rocking_hollywood_17.jpg
[%] File Downloaded !

[%] Downloading Image #5 from https://i.pinimg.com/originals/9d/71/e4/9d71e445c632a8a173e9e6fd27c476e3.jpg
[%] File Downloaded !

[%] Downloading Image #6 from https://www.pouted.com/wp-content/uploads/2015/04/ian-somerhalder-hd-wallpapers-1.jpg?x45357
[%] File Downloaded !

[%] Downloading Image #7

100%|██████████| 24/24 [00:02<00:00, 11.16it/s]


In [3]:
file_name = "list_actors.json"
actors = []

# Read the text file back into a list of strings, one entry per line.
with open(file_name, "r") as file:
    content = file.read()
    actors = content.splitlines()

# Show the list of names that will be processed.
print(actors)

if __name__ == '__main__':
    # This parameter is ignored downstream but kept for consistency.
    img_size = "large"

    main(actors, 100, img_size)

['Vin Diesel', 'Henry Cavill', 'Chris Hemsworth', 'Bruce Willis', 'Sandra Bullock', 'Bradley Cooper', 'Tom Hardy']
[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/Vin Diesel


[!!]Indexing page: 1

[%] Indexed 35 Images on Page 1.


[%] Downloading Image #1 from https://therecenttimes.com/wp-content/uploads/2023/12/Vin-Diesel.webp
[%] File Downloaded !

[%] Downloading Image #2 from https://www.usatoday.com/gcdn/authoring/videos/videoelephant/thumbnails/72011062007.jpg?width=NaN&amp;disable=upscale&amp;format=pjpg&amp;auto=webp
[%] File Downloaded !

[%] Downloading Image #3 from https://www.comingsoon.net/wp-content/uploads/sites/3/2023/12/vin-diesel-header-1.jpg
[%] File Downloaded !

[%] Downloading Image #4 from https://www.comingsoon.net/wp-content/uploads/sites/3/2023/05/vin-diesel-header-1.png
[%] File Downloaded !

[%] Downloading Image #5 from https://media.philstar.com/photos/2023/09/01/vin-diesel_2023-09-01_12-55-07.jpg
[%] File Downloaded !

[%] Do

[%] File Downloaded !

[%] Downloading Image #47 from http://photos.laineygossip.com/articles/vin-diesel-25jul14-01.jpg
[%] File Downloaded !

[%] Downloading Image #48 from https://getinfolist.com/wp-content/uploads/2016/01/3631198-fast-9.jpg
[%] File Downloaded !

[%] Downloading Image #49 from http://1.bp.blogspot.com/-FhNOi3nP4Qo/UHu8DZJMYpI/AAAAAAAAAno/8Xh0_ih7lAs/s1600/Vin_Diesel_11.jpg
[%] File Downloaded !

[%] Downloading Image #50 from http://yesgulf.com/wp-content/uploads/2015/04/vin-diesel-1.jpg
[Error]Invalid image, not saving http://yesgulf.com/wp-content/uploads/2015/04/vin-diesel-1.jpg

[!] Issue getting: http://yesgulf.com/wp-content/uploads/2015/04/vin-diesel-1.jpg
[!] Error:: Invalid image, not saving http://yesgulf.com/wp-content/uploads/2015/04/vin-diesel-1.jpg

[%] Downloading Image #50 from http://3.bp.blogspot.com/-GE4yzHnDpgA/UrSdPmm2OhI/AAAAAAAAaZo/C9MSDiWCM3I/s1600/Vin+Diesel+is+a.jpg
[%] File Downloaded !

[%] Downloading Image #51 from http://www.aceshowbiz

[%] File Downloaded !

[%] Downloading Image #86 from https://i.dailymail.co.uk/1s/2022/07/18/14/60401665-11024785-image-m-46_1658151807123.jpg
[%] File Downloaded !

[%] Downloading Image #87 from https://cdn.amomama.com/fbef1393b3d50423d925371d03894a04.jpg
[%] File Downloaded !

[%] Downloading Image #88 from https://pics.craiyon.com/2023-11-01/81e6685e95664515ac2e7cbd4782f756.webp
[%] File Downloaded !

[%] Downloading Image #89 from https://images.wallpapersden.com/image/download/ark-2-vin-diesel-character_bmVuZWqUmZqaraWkpJRnamtlrWZpaWU.jpg
[%] File Downloaded !

[%] Downloading Image #90 from https://www.lamansiondelasideas.com/wp-content/uploads/2022/10/casa-Vin-Diesel.jpg
[%] File Downloaded !

[%] Downloading Image #91 from https://www.usmagazine.com/wp-content/uploads/2022/11/is-vin-diesel-married-everything-to-know-about-gf-paloma-jimenez-01.jpg?quality=70&amp;strip=all
[%] File Downloaded !

[%] Downloading Image #92 from https://s43365.pcdn.co/wp-content/uploads/2023/12/Vi

100%|██████████| 90/90 [00:07<00:00, 11.56it/s]


[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/Henry Cavill


[!!]Indexing page: 1

[%] Indexed 35 Images on Page 1.


[%] Downloading Image #1 from https://image.tmdb.org/t/p/original/hErUwonrQgY5Y7RfxOfv8Fq11MB.jpg
[%] File Downloaded !

[%] Downloading Image #2 from http://upload.wikimedia.org/wikipedia/commons/b/ba/Henry_Cavill_at_the_2009_Tribeca_Film_Festival.jpg
[%] File Downloaded !

[%] Downloading Image #3 from http://upload.wikimedia.org/wikipedia/commons/5/53/Henry_Cavill_2013.jpg
[%] File Downloaded !

[%] Downloading Image #4 from https://www.femalefirst.co.uk/image-library/port/1000/h/henry-cavill-premiere-2---wi06-13.jpg
[%] File Downloaded !

[%] Downloading Image #5 from https://static.accessonline.com/uploads/239152.jpg
[%] File Downloaded !

[%] Downloading Image #6 from https://cdn.vox-cdn.com/thumbor/lbkd7A9zVRuEMoqGA4j25QV05X8=/1400x1400/filters:format(jpeg)/cdn.vox-cdn.com/uploads/chorus_asset/file/13047949/873854634.jpg.jpg
[%] File D

[%] File Downloaded !

[%] Downloading Image #41 from https://i1.wp.com/variety.com/wp-content/uploads/2022/12/Henry-Cavill.jpg
[%] File Downloaded !

[%] Downloading Image #42 from https://www.usmagazine.com/wp-content/uploads/2022/10/Henry-Cavill-GF-Natalie-Viscuso-Make-Red-Carpet-Debut.jpg?w=1600&amp;quality=86&amp;strip=all
[%] File Downloaded !

[%] Downloading Image #43 from https://wegotthiscovered.com/wp-content/uploads/2023/09/henry-cavill-argylle-2.jpg
[%] File Downloaded !

[%] Downloading Image #44 from https://images6.fanpop.com/image/photos/44700000/Henry-Cavill-Avatar-The-Way-of-Water-L-A-Premiere-December-12-2022-henry-cavill-44718218-1508-2048.jpg
[%] File Downloaded !

[%] Downloading Image #45 from https://wealthypeeps.com/wp-content/uploads/2023/06/239104.jpg
[%] File Downloaded !

[%] Downloading Image #46 from https://img-s-msn-com.akamaized.net/tenant/amp/entityid/AA1ncrzk.img?w=1500&amp;h=1000&amp;m=4&amp;q=60
[%] File Downloaded !

[%] Downloading Image #47 fro

[%] File Downloaded !

[%] Downloading Image #76 from https://m.media-amazon.com/images/M/MV5BM2ZiMTNmZjAtMjVjNC00NmEyLThjNGYtMTI1YWMxYzg1OGNkXkEyXkFqcGdeQXVyMTUzMTg2ODkz._V1_.jpg
[%] File Downloaded !

[%] Downloading Image #77 from https://imagez.tmz.com/image/5c/4by3/2022/10/29/5ce6743f9bd847e1ad818362fe091915_md.jpg
[%] File Downloaded !

[%] Downloading Image #78 from https://www.pinkvilla.com/images/2023-08/2038420479_image-2.jpg
[%] File Downloaded !

[%] Downloading Image #79 from https://people.com/thmb/huo-bqb3snkg8iuC7mhYisxULo0=/1500x0/filters:no_upscale():max_bytes(150000):strip_icc():focal(749x0:751x2)/henry-cavill-tout-012424-6a8cf3e2f1524d388643115150840c8b.jpg
[%] File Downloaded !

[%] Downloading Image #80 from https://averagebeing.com/wp-content/uploads/2023/01/5-Piers-Cavill.jpg
[%] File Downloaded !

[%] Downloading Image #81 from https://www.looper.com/img/gallery/this-look-at-henry-cavill-as-a-targaryen-is-truly-incredible/l-intro-1661475751.jpg
[%] File Downloa

temp_imagens/henry_cavill/Image_66.jpg
temp_imagens/henry_cavill/Image_67.jpg
temp_imagens/henry_cavill/Image_68.jpg
temp_imagens/henry_cavill/Image_69.jpg
temp_imagens/henry_cavill/Image_70.jpg
temp_imagens/henry_cavill/Image_71.jpg
temp_imagens/henry_cavill/Image_72.jpg
Remove image: temp_imagens/henry_cavill/Image_72.jpg
temp_imagens/henry_cavill/Image_73.jpg
temp_imagens/henry_cavill/Image_74.jpg
temp_imagens/henry_cavill/Image_75.jpg
temp_imagens/henry_cavill/Image_76.jpg
temp_imagens/henry_cavill/Image_77.jpg
temp_imagens/henry_cavill/Image_78.jpg
temp_imagens/henry_cavill/Image_79.jpg
temp_imagens/henry_cavill/Image_80.jpg
temp_imagens/henry_cavill/Image_81.jpg
temp_imagens/henry_cavill/Image_82.webp
temp_imagens/henry_cavill/Image_83.jpg
temp_imagens/henry_cavill/Image_84.jpg
temp_imagens/henry_cavill/Image_85.jpg
temp_imagens/henry_cavill/Image_86.jpg
temp_imagens/henry_cavill/Image_87.jpg
temp_imagens/henry_cavill/Image_88.jpg
temp_imagens/henry_cavill/Image_89.jpg
temp_image

100%|██████████| 99/99 [00:08<00:00, 11.34it/s]


[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/Chris Hemsworth


[!!]Indexing page: 1

[%] Indexed 35 Images on Page 1.


[%] Downloading Image #1 from https://media.glamour.com/photos/569580bd8fa134644ec26222/master/pass/entertainment-2015-11-chris-hemsworth-main.jpg
[%] File Downloaded !

[%] Downloading Image #2 from https://www.usmagazine.com/wp-content/uploads/2018/12/chris-hemsworth.jpg
[%] File Downloaded !

[%] Downloading Image #3 from https://photos.laineygossip.com/articles/chris-hemsworth-vancouver-01.jpg
[%] File Downloaded !

[%] Downloading Image #4 from http://images6.fanpop.com/image/photos/36200000/Chris-Hemsworth-image-chris-hemsworth-36262564-1468-1958.jpg
[%] File Downloaded !

[%] Downloading Image #5 from https://upload.wikimedia.org/wikipedia/commons/thumb/e/e8/Chris_Hemsworth_by_Gage_Skidmore_2_(cropped).jpg/1200px-Chris_Hemsworth_by_Gage_Skidmore_2_(cropped).jpg
[Error]Invalid image, not saving https://upload.wikimedia.org/wikipedia/

[%] File Downloaded !



[!!]Indexing page: 6

[%] Indexed 35 Images on Page 6.


[%] Downloading Image #34 from http://images4.fanpop.com/image/photos/19100000/Chris-Hemsworth-chris-hemsworth-19135763-920-1222.jpg
[%] File Downloaded !



[!!]Indexing page: 7

[%] Indexed 35 Images on Page 7.


[%] Downloading Image #35 from http://thoughtsinlittleboxes.files.wordpress.com/2012/09/chris-hemsworth-chris-hemsworth-19135826-877-1222.jpeg
[!] Issue getting: http://thoughtsinlittleboxes.files.wordpress.com/2012/09/chris-hemsworth-chris-hemsworth-19135826-877-1222.jpeg
[!] Error:: HTTP Error 403: Forbidden
[%] Downloading Image #35 from http://image.tmdb.org/t/p/original/eknQXvdsLkoCdF1wQ30f5qhbkXN.jpg
[!] Issue getting: http://image.tmdb.org/t/p/original/eknQXvdsLkoCdF1wQ30f5qhbkXN.jpg
[!] Error:: HTTP Error 404: Not Found


[!!]Indexing page: 8

[%] Indexed 35 Images on Page 8.


[%] Downloading Image #35 from https://images.hellomagazine.com/imagenes/healthandbeauty/health-and-fitness/20

[%] File Downloaded !

[%] Downloading Image #56 from https://pagesix.com/wp-content/uploads/sites/3/2023/08/NYPICHPDPICT000021739167.jpg
[%] File Downloaded !

[%] Downloading Image #57 from https://www.hollywoodreporter.com/wp-content/uploads/2023/06/Chris-Hemsworth-getty-1498028326-H-2023.jpg
[Error]Invalid image, not saving https://www.hollywoodreporter.com/wp-content/uploads/2023/06/Chris-Hemsworth-getty-1498028326-H-2023.jpg

[!] Issue getting: https://www.hollywoodreporter.com/wp-content/uploads/2023/06/Chris-Hemsworth-getty-1498028326-H-2023.jpg
[!] Error:: Invalid image, not saving https://www.hollywoodreporter.com/wp-content/uploads/2023/06/Chris-Hemsworth-getty-1498028326-H-2023.jpg

[%] Downloading Image #57 from https://new-cdn.mamamia.com.au/mamamia-pwa.appspot.com/cms_images/originals/DoRNovO36Rlu75omIcuJ_1668900176800.jpg
[%] File Downloaded !

[%] Downloading Image #58 from https://wcelebrity.com/wp-content/uploads/2023/08/Chris-Hemsworth.png
[%] File Downloaded !

[%]

[!] Issue getting: https://cosmicbook.news/wp-content/uploads/2023/01/chris-hemsworth-extraction-2-release-date-footage.jpg
[!] Error:: HTTP Error 404: Not Found
[%] Downloading Image #91 from https://static1.moviewebimages.com/wordpress/wp-content/uploads/2023/05/chris-hemsworth-in-extraction-2.jpeg
[%] File Downloaded !

[%] Downloading Image #92 from https://images.wallpapersden.com/image/download/extraction-2-chris-hemsworth-action_bmVnbG2UmZqaraWkpJRnaWVlrWZoamU.jpg
[%] File Downloaded !

[%] Downloading Image #93 from https://img.uhdpaper.com/wallpaper/extraction-2-chris-hemsworth-movie-291@1@k-phone-4k.jpg
[Error]Invalid image, not saving https://img.uhdpaper.com/wallpaper/extraction-2-chris-hemsworth-movie-291@1@k-phone-4k.jpg

[!] Issue getting: https://img.uhdpaper.com/wallpaper/extraction-2-chris-hemsworth-movie-291@1@k-phone-4k.jpg
[!] Error:: Invalid image, not saving https://img.uhdpaper.com/wallpaper/extraction-2-chris-hemsworth-movie-291@1@k-phone-4k.jpg

[%] Downloadin

100%|██████████| 93/93 [00:07<00:00, 12.64it/s]


[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/Bruce Willis


[!!]Indexing page: 1

[%] Indexed 35 Images on Page 1.


[%] Downloading Image #1 from https://2.bp.blogspot.com/-dThCvec16-c/UfifzGwaA_I/AAAAAAAAA3Q/f-oeGEh7PSs/s1600/Bruce-Willis.jpg
[%] File Downloaded !

[%] Downloading Image #2 from https://cdn.britannica.com/48/194248-050-4EE825CF/Bruce-Willis-2013.jpg
[Error]Invalid image, not saving https://cdn.britannica.com/48/194248-050-4EE825CF/Bruce-Willis-2013.jpg

[!] Issue getting: https://cdn.britannica.com/48/194248-050-4EE825CF/Bruce-Willis-2013.jpg
[!] Error:: Invalid image, not saving https://cdn.britannica.com/48/194248-050-4EE825CF/Bruce-Willis-2013.jpg

[%] Downloading Image #2 from https://short-biography.com/wp-content/uploads/bruce-willis/W.B.-Willis.jpg
[%] File Downloaded !

[%] Downloading Image #3 from https://upload.wikimedia.org/wikipedia/commons/0/03/Bruce_Willis_by_Gage_Skidmore.jpg
[%] File Downloaded !

[%] Downloading Image #4 

[%] File Downloaded !

[%] Downloading Image #41 from https://people.com/thmb/olTbjA-Of3uU44CB4EhYXn6nkCY=/1500x0/filters:no_upscale():max_bytes(150000):strip_icc():focal(649x179:651x181)/Bruce-willis-090422-2000-e17851c4524f43689e074d6f7b6c684a.jpg
[%] File Downloaded !

[%] Downloading Image #42 from https://nypost.com/wp-content/uploads/sites/2/2023/12/bruce-willis-holds-onto-daughter-72825385.jpg
[%] File Downloaded !

[%] Downloading Image #43 from https://www.the-sun.com/wp-content/uploads/sites/6/2023/03/sad-times-bruce-willis-fans-804496385.jpg
[%] File Downloaded !

[%] Downloading Image #44 from https://s.abcnews.com/images/GMA/230405_gma_digital_bruce_willis_hpMain_1x1_992.jpg
[%] File Downloaded !

[%] Downloading Image #45 from https://pagesix.com/wp-content/uploads/sites/3/2023/03/NYPICHPDPICT000007546519.jpg?quality=90&amp;strip=all
[%] File Downloaded !

[%] Downloading Image #46 from https://cdn.abcotvs.com/dip/images/13328637_060123-wls-tallullah-willis-bruce-dementia

[%] File Downloaded !



[!!]Indexing page: 12

[%] Indexed 35 Images on Page 12.


[%] Downloading Image #85 from http://images2.fanpop.com/images/photos/4800000/Bruce-bruce-willis-4866240-1024-768.jpg
[%] File Downloaded !

[%] Downloading Image #86 from http://www.actors-pictures.com/pictures/bruce-willis-40.jpg
[!] Issue getting: http://www.actors-pictures.com/pictures/bruce-willis-40.jpg
[!] Error:: HTTP Error 404: Not Found


[!!]Indexing page: 13

[%] Indexed 35 Images on Page 13.


[%] Downloading Image #86 from http://blog.fingerprintdoorlocks.com/wp-content/uploads/2012/06/bruce_willis.jpg
[%] File Downloaded !



[!!]Indexing page: 14

[%] Indexed 35 Images on Page 14.


[%] Downloading Image #87 from http://images1.fanpop.com/images/image_uploads/Bruce-Willis-bruce-willis-817692_1024_768.jpg
[%] File Downloaded !



[!!]Indexing page: 15

[%] Indexed 35 Images on Page 15.




[!!]Indexing page: 16

[%] Indexed 35 Images on Page 16.




[!!]Indexing page: 17

[%] Indexed 35 



temp_imagens/bruce_willis/Image_90.PNG
temp_imagens/bruce_willis/Image_91.jpg
temp_imagens/bruce_willis/Image_92.jpg
temp_imagens/bruce_willis/Image_93.jpg
temp_imagens/bruce_willis/Image_94.jpg
temp_imagens/bruce_willis/Image_95.jpg
temp_imagens/bruce_willis/Image_96.jpg
temp_imagens/bruce_willis/Image_97.png
temp_imagens/bruce_willis/Image_98.jpg
temp_imagens/bruce_willis/Image_99.jpg
temp_imagens/bruce_willis/Image_100.jpg


100%|██████████| 93/93 [00:08<00:00, 10.49it/s]


[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/Sandra Bullock


[!!]Indexing page: 1

[%] Indexed 35 Images on Page 1.


[%] Downloading Image #1 from https://www.sheknows.com/wp-content/uploads/2022/06/sandra-bullock.jpg
[%] File Downloaded !

[%] Downloading Image #2 from https://faroutmagazine.co.uk/static/uploads/1/2022/12/When-Sandra-Bullock-graciously-accepted-a-Razzie-award.jpg
[%] File Downloaded !

[%] Downloading Image #3 from https://i.dailymail.co.uk/1s/2023/03/12/19/68611515-11851113-image-m-66_1678649952952.jpg
[%] File Downloaded !

[%] Downloading Image #4 from https://nationaltoday.com/wp-content/uploads/2022/10/19-Sandra-Bullock.jpg
[Error]Invalid image, not saving https://nationaltoday.com/wp-content/uploads/2022/10/19-Sandra-Bullock.jpg

[!] Issue getting: https://nationaltoday.com/wp-content/uploads/2022/10/19-Sandra-Bullock.jpg
[!] Error:: Invalid image, not saving https://nationaltoday.com/wp-content/uploads/2022/10/19-Sandra-Bullock.jp

[%] File Downloaded !

[%] Downloading Image #37 from http://images4.fanpop.com/image/photos/19800000/Sandra-Bullock-sandra-bullock-19873201-1472-2000.jpg
[%] File Downloaded !

[%] Downloading Image #38 from http://how-rich.com/wp-content/uploads/2012/09/SandraBullockMay-attrbAngelaGeorge.jpg
[!] Issue getting: http://how-rich.com/wp-content/uploads/2012/09/SandraBullockMay-attrbAngelaGeorge.jpg
[!] Error:: <urlopen error timed out>
[%] Downloading Image #38 from http://www.theplace2.ru/archive/sandra_bullock/img/msg_126283576998_3.jpg
[%] File Downloaded !

[%] Downloading Image #39 from http://upload.wikimedia.org/wikipedia/commons/6/67/Sandra_Bullock_2011_AA.jpg
[%] File Downloaded !

[%] Downloading Image #40 from https://ucesy-sk.happyhair.sk/celebrity_img/bullock1au2309.jpg
[%] File Downloaded !

[%] Downloading Image #41 from http://images.fanpop.com/images/image_uploads/Sandra-Bullock-sandra-bullock-87419_1024_768.jpg
[%] File Downloaded !

[%] Downloading Image #42 from http:

[%] File Downloaded !

[%] Downloading Image #80 from https://www.giantfreakinrobot.com/wp-content/uploads/2023/08/sandra-bullock-demolition-man-900x506.jpg
[%] File Downloaded !

[%] Downloading Image #81 from https://i.insider.com/6254570dc9e897001814bc9d?width=1000&amp;format=jpeg&amp;auto=webp
[%] File Downloaded !

[%] Downloading Image #82 from https://www.ok-magazin.de/sites/default/files/styles/image870w/public/2023-08/sandra-bullock-mit-bryan-randall-maerz-2016-ddp.jpg?h=25c60405
[%] File Downloaded !

[%] Downloading Image #83 from https://img.onmanorama.com/content/dam/mm/en/entertainment/entertainment-news/images/2023/8/8/bryan-randall.jpg
[%] File Downloaded !

[%] Downloading Image #84 from https://i.dailymail.co.uk/1s/2023/08/15/02/74317043-12407103-Sandra_Bullock_was_pictured_for_the_first_time_since_the_tragic_-a-19_1692063653849.jpg
[%] File Downloaded !

[%] Downloading Image #85 from https://netstorage-kami.akamaized.net/images/f3377e01fee15a63.png?imwidth=900
[%] F

temp_imagens/sandra_bullock/Image_64.jpg
temp_imagens/sandra_bullock/Image_65.jpg
temp_imagens/sandra_bullock/Image_66.jpg
temp_imagens/sandra_bullock/Image_67.jpg
temp_imagens/sandra_bullock/Image_68.jpg
temp_imagens/sandra_bullock/Image_69.jpg
temp_imagens/sandra_bullock/Image_70.jpg
temp_imagens/sandra_bullock/Image_71.jpg
temp_imagens/sandra_bullock/Image_72.jpg
temp_imagens/sandra_bullock/Image_73.jpg
temp_imagens/sandra_bullock/Image_74.jpg
temp_imagens/sandra_bullock/Image_75.jpg
temp_imagens/sandra_bullock/Image_76.jpg
temp_imagens/sandra_bullock/Image_77.jpg
temp_imagens/sandra_bullock/Image_78.jpg
temp_imagens/sandra_bullock/Image_79.jpg
temp_imagens/sandra_bullock/Image_80.jpg
temp_imagens/sandra_bullock/Image_81.jpg
temp_imagens/sandra_bullock/Image_82.jpg
Remove image: temp_imagens/sandra_bullock/Image_82.jpg
temp_imagens/sandra_bullock/Image_83.jpg
temp_imagens/sandra_bullock/Image_84.jpg
Remove image: temp_imagens/sandra_bullock/Image_84.jpg
temp_imagens/sandra_bullock/I

100%|██████████| 93/93 [00:09<00:00,  9.90it/s]


[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/Bradley Cooper


[!!]Indexing page: 1

[%] Indexed 35 Images on Page 1.


[%] Downloading Image #1 from https://www.newdvdreleasedates.com/images/profiles/bradley-cooper-13.jpg
[!] Issue getting: https://www.newdvdreleasedates.com/images/profiles/bradley-cooper-13.jpg
[!] Error:: HTTP Error 404: Not Found
[%] Downloading Image #1 from https://upload.wikimedia.org/wikipedia/commons/b/bd/Glasto17-44_(35547413626)_Cropped.jpg
[%] File Downloaded !

[%] Downloading Image #2 from https://www.biography.com/.image/t_share/MTE1ODA0OTcxNTEyODU4MTI1/bradley-cooper-547062-1-402.jpg
[!] Issue getting: https://www.biography.com/.image/t_share/MTE1ODA0OTcxNTEyODU4MTI1/bradley-cooper-547062-1-402.jpg
[!] Error:: HTTP Error 404: Not Found
[%] Downloading Image #2 from http://photos.laineygossip.com/articles/bradley-cooper-nom-15jan15-07.jpg
[%] File Downloaded !

[%] Downloading Image #3 from https://www.usmagazine.com/wp-conten

[%] Indexed 35 Images on Page 7.


[%] Downloading Image #33 from http://www.aceshowbiz.com/images/wennpic/bradley-cooper-16th-annual-hollywood-film-awards-gala-01.jpg
[%] File Downloaded !



[!!]Indexing page: 8

[%] Indexed 35 Images on Page 8.


[%] Downloading Image #34 from http://image.tmdb.org/t/p/original/rxUG6unp3zfLZrR9RxCNtcXTbk.jpg
[%] File Downloaded !



[!!]Indexing page: 9

[%] Indexed 35 Images on Page 9.


[%] Downloading Image #35 from http://photos.laineygossip.com/articles/bradley-cooper-nom-15jan15-05.jpg
[%] File Downloaded !

[%] Downloading Image #36 from https://media.gq-magazine.co.uk/photos/5d13ab2b92ae5fb0c3a33930/master/w_1920%2cc_limit/bradley-cooper-06-gq-3jan19_getty_b.jpg
[%] File Downloaded !



[!!]Indexing page: 10

[%] Indexed 35 Images on Page 10.




[!!]Indexing page: 11

[%] Indexed 35 Images on Page 11.


[%] Downloading Image #37 from https://cdn.vox-cdn.com/thumbor/d40WguuYhkbE9RSjBoNA-tlfnHE=/0x0:2261x2749/1200x0/filters:focal(0x0:2261x274

[Error]Invalid image, not saving https://e3.365dm.com/24/01/768x432/skynews-bradley-cooper-golden-globes_6414454.jpg?20240108005857

[!] Issue getting: https://e3.365dm.com/24/01/768x432/skynews-bradley-cooper-golden-globes_6414454.jpg?20240108005857
[!] Error:: Invalid image, not saving https://e3.365dm.com/24/01/768x432/skynews-bradley-cooper-golden-globes_6414454.jpg?20240108005857



[!!]Indexing page: 13

[%] Indexed 35 Images on Page 13.


[%] Downloading Image #66 from https://photos.laineygossip.com/articles/bradley-cooper-asib-25sept18-01.jpg
[%] File Downloaded !



[!!]Indexing page: 14

[%] Indexed 35 Images on Page 14.


[%] Downloading Image #67 from http://actor-images.celebritizer.com/actor/116029/Bradley-Cooper.jpg
[%] File Downloaded !



[!!]Indexing page: 15

[%] Indexed 35 Images on Page 15.


[%] Downloading Image #68 from https://www.thefamouspeople.com/profiles/images/bradley-cooper-1.jpg
[%] File Downloaded !



[!!]Indexing page: 16

[%] Indexed 35 Images on P

[%] File Downloaded !



[%] Done. Downloaded 100 images.
temp_imagens/bradley_cooper/Image_1.jpg
temp_imagens/bradley_cooper/Image_2.jpg
temp_imagens/bradley_cooper/Image_3.jpg
temp_imagens/bradley_cooper/Image_4.jpg
temp_imagens/bradley_cooper/Image_5.jpg
temp_imagens/bradley_cooper/Image_6.jpg
temp_imagens/bradley_cooper/Image_7.jpg
temp_imagens/bradley_cooper/Image_8.jpg
temp_imagens/bradley_cooper/Image_9.jpg
temp_imagens/bradley_cooper/Image_10.jpg
temp_imagens/bradley_cooper/Image_11.jpg
temp_imagens/bradley_cooper/Image_12.jpg
temp_imagens/bradley_cooper/Image_13.jpg
temp_imagens/bradley_cooper/Image_14.jpg
temp_imagens/bradley_cooper/Image_15.jpg
temp_imagens/bradley_cooper/Image_16.jpg
temp_imagens/bradley_cooper/Image_17.jpg
temp_imagens/bradley_cooper/Image_18.jpg
Remove image: temp_imagens/bradley_cooper/Image_18.jpg
temp_imagens/bradley_cooper/Image_19.jpg
temp_imagens/bradley_cooper/Image_20.jpg
temp_imagens/bradley_cooper/Image_21.jpg
temp_imagens/bradley_cooper/Image_2

100%|██████████| 97/97 [00:09<00:00, 10.19it/s]


[%] Downloading Images to /opt/jupyter/notebook/web_scraping/temp_imagens/Tom Hardy


[!!]Indexing page: 1

[%] Indexed 35 Images on Page 1.


[%] Downloading Image #1 from https://d.newsweek.com/en/full/784947/tom-hardy.jpg
[%] File Downloaded !

[%] Downloading Image #2 from http://images6.fanpop.com/image/photos/39200000/Tom-Hardy-tom-hardy-39213950-928-1326.jpg
[%] File Downloaded !

[%] Downloading Image #3 from http://images4.fanpop.com/image/photos/20300000/Tom-Hardy-tom-hardy-20320916-1011-1280.jpg
[%] File Downloaded !

[%] Downloading Image #4 from http://images6.fanpop.com/image/photos/32700000/Tom-Hardy-Photo-Shoot-tom-hardy-32767822-750-960.jpg
[%] File Downloaded !

[%] Downloading Image #5 from http://image.tmdb.org/t/p/original/j1zJKn5dr3VQC3upjgHL68cnPcB.jpg
[%] File Downloaded !

[%] Downloading Image #6 from https://www.thefamouspeople.com/profiles/images/tom-hardy-1.jpg
[%] File Downloaded !

[%] Downloading Image #7 from https://ilarge.lisimg.com/image/7976369/1118

[%] File Downloaded !

[%] Downloading Image #36 from https://static1.cbrimages.com/wordpress/wp-content/uploads/2024/02/tom-hardy-the-bikeriders.jpg
[%] File Downloaded !

[%] Downloading Image #37 from https://cdn.shopify.com/s/files/1/0030/3742/9849/files/Tom_Hardy_s_Details.jpg?v=1674662344
[%] File Downloaded !

[%] Downloading Image #38 from https://www.indiewire.com/wp-content/uploads/2022/07/AP21257649752518.jpg?w=780
[%] File Downloaded !

[%] Downloading Image #39 from https://e00-marca.uecdn.es/assets/multimedia/imagenes/2023/03/28/16800057962197.jpg
[%] File Downloaded !

[%] Downloading Image #40 from https://www.slashfilm.com/img/gallery/tom-hardy-turned-his-gangster-roles-into-a-career-long-character-study/l-intro-1662586451.jpg
[%] File Downloaded !

[%] Downloading Image #41 from https://meforworld.com/wp-content/uploads/2022/07/Tom_Hardy.jpg
[%] File Downloaded !

[%] Downloading Image #42 from https://www.thedigitalfix.com/wp-content/sites/thedigitalfix/2023/09/tom-h

[%] File Downloaded !

[%] Downloading Image #69 from http://image.tmdb.org/t/p/original/9MCdyZJkwyXmymMIrA1uvEWzaWU.jpg
[%] File Downloaded !

[%] Downloading Image #70 from https://ilarge.lisimg.com/image/7947693/740full-tom-hardy.jpg
[%] File Downloaded !

[%] Downloading Image #71 from https://manofmany.com/wp-content/uploads/2022/04/6-Tom-Hardy-Workout-Diet-Plan-1200x900.jpg
[%] File Downloaded !

[%] Downloading Image #72 from https://tzm.vn/uploads/images/blog/admin/2024/01/23/tom-hardy-1705951391.webp
[%] File Downloaded !

[%] Downloading Image #73 from https://i.dailymail.co.uk/1s/2022/09/20/10/62610727-0-image-a-52_1663667158129.jpg
[%] File Downloaded !

[%] Downloading Image #74 from https://media.ghgossip.com/wp-content/uploads/2023/05/25144818/Tom-Hardy-768x511.jpg
[%] File Downloaded !

[%] Downloading Image #75 from https://www.eightieskids.com/wp-content/uploads/2018/11/Tom-Hardy-2.jpg
[%] File Downloaded !

[%] Downloading Image #76 from https://manofmany.com/wp-cont

temp_imagens/tom_hardy/Image_45.jpg
temp_imagens/tom_hardy/Image_46.jpg
temp_imagens/tom_hardy/Image_47.JPG
temp_imagens/tom_hardy/Image_48.jpg
temp_imagens/tom_hardy/Image_49.jpg
temp_imagens/tom_hardy/Image_50.jpg
temp_imagens/tom_hardy/Image_51.jpg
temp_imagens/tom_hardy/Image_52.png
temp_imagens/tom_hardy/Image_53.jpg
temp_imagens/tom_hardy/Image_54.jpg
Remove image: temp_imagens/tom_hardy/Image_54.jpg
temp_imagens/tom_hardy/Image_55.png
temp_imagens/tom_hardy/Image_56.jpg
temp_imagens/tom_hardy/Image_57.jpg
temp_imagens/tom_hardy/Image_58.jpg
temp_imagens/tom_hardy/Image_59.jpg
temp_imagens/tom_hardy/Image_60.jpg
temp_imagens/tom_hardy/Image_61.jpg
temp_imagens/tom_hardy/Image_62.jpg
temp_imagens/tom_hardy/Image_63.jpg
temp_imagens/tom_hardy/Image_64.jpg
temp_imagens/tom_hardy/Image_65.jpg
temp_imagens/tom_hardy/Image_66.jpg
Remove image: temp_imagens/tom_hardy/Image_66.jpg
temp_imagens/tom_hardy/Image_67.jpg
temp_imagens/tom_hardy/Image_68.jpg
temp_imagens/tom_hardy/Image_69.jpg


100%|██████████| 92/92 [00:09<00:00, 10.15it/s]
