Skip to content

Commit

Permalink
manga recommendation poster url parsing fix and updated cover to poster in json response
Browse files Browse the repository at this point in the history
  • Loading branch information
Cosmicoppai committed Jun 9, 2024
1 parent 5e390d1 commit 7297726
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions backend/scraper/manga_scraper.py
Original file line number Diff line number Diff line change
Expand Up @@ -99,7 +99,7 @@ async def __scrape_list(search_bs: BeautifulSoup) -> List[Dict[str, str]]:

media = title_bs.find("div", {"class": "media"})
media_a = media.find("div", {"class": "wrap_img"}).find("a")
manga["cover"] = media_a.find("img")["src"]
manga["poster"] = media_a.find("img")["src"]
manga["status"] = media.find("div", {"class": "status"}).text.strip().capitalize()

manga_session = media_a['href']
Expand All @@ -124,7 +124,7 @@ async def __scrape_detail(search_bs: BeautifulSoup) -> List[Dict[str, str]]:
for genre in meta_data.find("div", {"class": "genres"}).find_all("a"):
manga["genres"].append(genre.string)

manga["cover"] = search_bs.find("div", {"class": "cover"}).find("img")["src"]
manga["poster"] = search_bs.find("div", {"class": "cover"}).find("img")["src"]
manga["status"] = meta_data.find("div", {"class": "status"}).text.capitalize()
manga_url = search_bs.find("meta", property="og:url")["content"]
manga["manga_detail"] = f"{ServerConfig.API_SERVER_ADDRESS}/manga_detail?session={manga_url}"
Expand Down Expand Up @@ -177,13 +177,13 @@ async def get_recommendation(self, manga_session: str) -> List[Dict[str, str]]:

for rec in widget.find_all("div", {"class": "item"}):

recommendation = {"title": str, "total_eps": float, "cover": str, "status": str, "manga_detail": str} # noqa
recommendation = {"title": str, "total_chps": float, "poster": str, "status": str, "manga_detail": str} # noqa

recommendation["cover"] = rec.find("div", {"class": "wrap_img"}).find("a")["href"]
recommendation["poster"] = rec.find("div", {"class": "wrap_img"}).find("img")["data-src"]
rec_data = rec.find("div", {"class": "text"})
title_data = rec_data.find("h3")
recommendation["title"] = title_data.text
recommendation["total_eps"] = float(rec_data.find("div", {"class": "chapter"}).text.strip("Chapter ").split(" ")[0])
recommendation["total_chps"] = float(rec_data.find("div", {"class": "chapter"}).text.strip("Chapter ").split(" ")[0])
recommendation["status"] = rec_data.find("div", {"class": "status"}).text
manga_session = title_data.find('a')['href']
recommendation["manga_detail"] = f"{ServerConfig.API_SERVER_ADDRESS}/manga_detail?session={manga_session}"
Expand Down

0 comments on commit 7297726

Please sign in to comment.