In [4]:
# Install dependencies
!pip install beautifulsoup4 requests

# Import library
import requests
from bs4 import BeautifulSoup
from IPython.display import Image, display
import os

# Target URL
url = "https://megamitensei.fandom.com/wiki/Persona_4"

# Request halaman web
response = requests.get(url)
if response.status_code == 200:
    print("Situs berhasil diakses!")
else:
    print(f"Gagal mengakses situs, kode status: {response.status_code}")

# Parsing konten HTML
soup = BeautifulSoup(response.content, "html.parser")

# Mengambil data teks (judul, deskripsi, dan daftar poin)
def scrape_text():
    # Mengambil judul halaman
    title = soup.find("h1", {"class": "page-header__title"})
    if title:
        print(f"Judul Halaman: {title.get_text(strip=True)}")
    else:
        print("Judul halaman tidak ditemukan.")

    # Mengambil deskripsi/summary
    summary = soup.find("div", {"class": "mw-parser-output"})
    if summary:
        print("\n== Deskripsi Singkat ==")
        paragraphs = summary.find_all("p")
        for i, p in enumerate(paragraphs[:3]):  # Menampilkan 3 paragraf pertama
            print(f"Paragraf {i+1}:\n{p.get_text(strip=True)}\n")
    else:
        print("Deskripsi tidak ditemukan.")

    # Mengambil daftar poin (jika ada)
    print("\n== Daftar Poin ==")
    bullet_points = summary.find_all("ul")
    if bullet_points:
        for ul in bullet_points[:2]:  # Batas 2 daftar poin pertama
            for li in ul.find_all("li"):
                print(f"- {li.get_text(strip=True)}")
    else:
        print("Daftar poin tidak ditemukan.")

# Mengambil gambar utama berdasarkan kategori
def scrape_images():
    # Membuat folder untuk menyimpan gambar berdasarkan kategori
    os.makedirs("downloaded_images/small", exist_ok=True)
    os.makedirs("downloaded_images/large", exist_ok=True)

    # Mengambil semua elemen gambar
    images = soup.find_all("img", {"src": True})
    for i, img in enumerate(images):  # Proses semua gambar yang ditemukan
        img_url = img["src"]

        # Handle URL yang tidak lengkap
        if not img_url.startswith("http"):
            img_url = "https:" + img_url

        # Membandingkan ukuran gambar menggunakan atribut 'width' atau 'height' jika tersedia
        img_width = img.get("width")
        img_category = "small" if img_width and int(img_width) < 200 else "large"

        print(f"Gambar {i+1} ({img_category}): {img_url}")
        try:
            # Download gambar
            img_data = requests.get(img_url).content
            img_filename = f"downloaded_images/{img_category}/image_{i+1}.jpg"
            with open(img_filename, "wb") as f:
                f.write(img_data)
            print(f"Gambar {i+1} berhasil disimpan sebagai {img_filename}")

            # Tampilkan gambar di output
            display(Image(url=img_url))
        except Exception as e:
            print(f"Gagal mengunduh gambar: {e}")

# Jalankan fungsi scraping
print("\n== Data Teks ==")
scrape_text()
print("\n== Data Gambar Berdasarkan Kategori ==")
scrape_images()


Situs berhasil diakses!

== Data Teks ==
Judul Halaman: Persona 4

== Deskripsi Singkat ==
Paragraf 1:
Persona 4ペルソナ4Perusona 4Game InformationDeveloperAtlusPublisherAtlus (JPN, NA)Square Enix (EU)Ubisoft(AU)Sony(KR)GenreRPGPlatformPlayStation 2,PlayStation 3*SalesFirst WeekJapan (PS2) - 211,967[1]Life to DateJapan (PS2) - 358,899 (294,214 +The Best64,685)NA - 100kDevelopmentDirector(s)Katsura HashinoWriter(s)Yuichiro TanakaAkira KawasakiArtist(s)Shigenori SoejimaSusumu NishizawaDesigner(s)Atsushi WatanabeAzusa KidoProgrammer(s)Yujiro KosakaComposer(s)Shoji MeguroRelease DatesJapanJuly 10, 2008The BestAugust 5, 2010North AmericaPlayStation 2December 9, 2008PlayStation StoreApril 8, 2014EuropeMarch 13, 2009AustraliaMarch 12, 2009South KoreaOctober 31, 2008

Paragraf 2:
Persona 4, localized in the West asShin Megami Tensei: Persona 4, is the fifth game in thePersonaseries. The game was developed by Atlus for thePlayStation 2, and was ported to thePlayStation 3's PlayStation Store as a do

Gambar 2 (large): https://static.wikia.nocookie.net/megamitensei/images/e/e6/Site-logo.png/revision/latest?cb=20210626181118
Gambar 2 berhasil disimpan sebagai downloaded_images/large/image_2.jpg


Gambar 3 (large): https://static.wikia.nocookie.net/megamitensei/images/9/9b/P4-CoverArt.jpg/revision/latest/scale-to-width-down/350?cb=20160516234031
Gambar 3 berhasil disimpan sebagai downloaded_images/large/image_3.jpg


Gambar 4 (small): https://static.wikia.nocookie.net/megamitensei/images/6/60/Flag_of_Japan.png/revision/latest/scale-to-width-down/25?cb=20130115003127
Gambar 4 berhasil disimpan sebagai downloaded_images/small/image_4.jpg


Gambar 5 (small): https://static.wikia.nocookie.net/megamitensei/images/d/de/Flag_of_the_United_States.png/revision/latest/scale-to-width-down/25?cb=20170330020633
Gambar 5 berhasil disimpan sebagai downloaded_images/small/image_5.jpg


Gambar 6 (small): https://static.wikia.nocookie.net/megamitensei/images/1/19/Flag_of_Europe.png/revision/latest/scale-to-width-down/25?cb=20130115003016
Gambar 6 berhasil disimpan sebagai downloaded_images/small/image_6.jpg


Gambar 7 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 8 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 9 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 10 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAA

Gambar 12 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 13 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 14 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 15 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAA

Gambar 18 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 19 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 20 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 21 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAA

Gambar 27 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 28 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 29 (large): https://static.wikia.nocookie.net/megamitensei/images/3/3c/Dojimaresi.jpg/revision/latest/scale-to-width-down/250?cb=20090601135732
Gambar 29 berhasil disimpan sebagai downloaded_images/large/image_29.jpg


Gambar 30 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 31 (large): https://static.wikia.nocookie.net/megamitensei/images/1/13/Brosuke.gif/revision/latest/scale-to-width-down/250?cb=20170211005706
Gambar 31 berhasil disimpan sebagai downloaded_images/large/image_31.jpg


Gambar 32 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 33 (large): https://static.wikia.nocookie.net/megamitensei/images/f/fe/Midnight.png/revision/latest/scale-to-width-down/250?cb=20200904013026
Gambar 33 berhasil disimpan sebagai downloaded_images/large/image_33.jpg


Gambar 34 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 35 (large): https://static.wikia.nocookie.net/megamitensei/images/8/80/Persona_4_Yukiko%27s_Castle_2.jpg/revision/latest/scale-to-width-down/250?cb=20111228060845
Gambar 35 berhasil disimpan sebagai downloaded_images/large/image_35.jpg


Gambar 36 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 37 (large): https://static.wikia.nocookie.net/megamitensei/images/8/8e/Yip2.png/revision/latest/scale-to-width-down/250?cb=20160917122451
Gambar 37 berhasil disimpan sebagai downloaded_images/large/image_37.jpg


Gambar 38 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 39 (large): https://static.wikia.nocookie.net/megamitensei/images/c/cf/AllOutP4.png/revision/latest/scale-to-width-down/250?cb=20160927185944
Gambar 39 berhasil disimpan sebagai downloaded_images/large/image_39.jpg


Gambar 40 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 41 (large): https://static.wikia.nocookie.net/megamitensei/images/f/f1/ShuffleTimeP4.png/revision/latest/scale-to-width-down/250?cb=20160927190238
Gambar 41 berhasil disimpan sebagai downloaded_images/large/image_41.jpg


Gambar 42 (small): https://static.wikia.nocookie.net/megamitensei/images/f/fe/Persona_4_Logo_White.png/revision/latest/scale-to-width-down/185?cb=20210606140945
Gambar 42 berhasil disimpan sebagai downloaded_images/small/image_42.jpg


Gambar 43 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 44 (small): https://static.wikia.nocookie.net/megamitensei/images/b/b1/Persona4cover.jpg/revision/latest/scale-to-width-down/130?cb=20080609040715
Gambar 44 berhasil disimpan sebagai downloaded_images/small/image_44.jpg


Gambar 45 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 46 (small): https://static.wikia.nocookie.net/megamitensei/images/2/27/SMTPersona4cover.jpg/revision/latest/scale-to-width-down/131?cb=20090313085833
Gambar 46 berhasil disimpan sebagai downloaded_images/small/image_46.jpg


Gambar 47 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 48 (small): https://static.wikia.nocookie.net/megamitensei/images/2/29/Persona_4.jpg/revision/latest/scale-to-width-down/131?cb=20090402213705
Gambar 48 berhasil disimpan sebagai downloaded_images/small/image_48.jpg


Gambar 49 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 50 (small): https://static.wikia.nocookie.net/megamitensei/images/8/83/P4-Concept.jpg/revision/latest/scale-to-width-down/185?cb=20080810030201
Gambar 50 berhasil disimpan sebagai downloaded_images/small/image_50.jpg


Gambar 51 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 52 (small): https://static.wikia.nocookie.net/megamitensei/images/a/a8/Persona_DoubleJump_Atlus_Interview.png/revision/latest/scale-to-width-down/185?cb=20141130072813
Gambar 52 berhasil disimpan sebagai downloaded_images/small/image_52.jpg


Gambar 53 (small): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 54 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 55 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D': No host supplied
Gambar 56 (large): https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAAAAABAAEAQAICTAEAOw%3D%3D
Gagal mengunduh gambar: Invalid URL 'https:data:image/gif;base64,R0lGODlhAQABAIABAAAAAP///yH5BAEAAAEALAAA

Gambar 64 (large): https://static.wikia.nocookie.net/ff185fe4-8356-4b6b-ad48-621b95a82a1d
Gambar 64 berhasil disimpan sebagai downloaded_images/large/image_64.jpg


Gambar 65 (large): https://static.wikia.nocookie.net/f3fc9271-3d5e-4c73-9afc-e6a9f6154ff1
Gambar 65 berhasil disimpan sebagai downloaded_images/large/image_65.jpg


Gambar 66 (large): https://static.wikia.nocookie.net/3f46912f-45a8-47f0-ac9d-6dca02c3a5ca
Gambar 66 berhasil disimpan sebagai downloaded_images/large/image_66.jpg


Gambar 67 (large): https://static.wikia.nocookie.net/6e8f2e52-ab5a-427f-a836-ab57168161ec
Gambar 67 berhasil disimpan sebagai downloaded_images/large/image_67.jpg
