From 25206b3827da64f66be27719598d5e01d2b754c4 Mon Sep 17 00:00:00 2001 From: zGadli Date: Sat, 6 Apr 2024 18:00:41 +0530 Subject: [PATCH] Fix bug in webtoon css selectors --- sources/en/w/webtoon.py | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/sources/en/w/webtoon.py b/sources/en/w/webtoon.py index 941ec3856..478f36de1 100644 --- a/sources/en/w/webtoon.py +++ b/sources/en/w/webtoon.py @@ -11,7 +11,7 @@ class WebToonsCrawler(Crawler): has_manga = True base_url = ["https://www.webtoons.com/"] - search_url = "%ssearch?keyword=%s" + search_url = "%s/en/search?keyword=%s" def initialize(self) -> None: self.cleaner.bad_tags.update(["h3"]) @@ -28,7 +28,7 @@ def search_novel(self, query): results = [] for tab in soup.select("ul.card_lst li"): a = tab.select_one("a") - title = tab.select_one("p.subj") + title = tab.select_one("p.subj").get_text() results.append( { "title": title, @@ -38,7 +38,7 @@ def search_novel(self, query): for tab in soup1.select("div.challenge_lst.search ul"): a = tab.select_one("a.challenge_item") - title = tab.select_one("p.subj") + title = tab.select_one("p.subj").get_text() results.append( { "title": title, @@ -53,6 +53,8 @@ def read_novel_info(self): # need to check if there is only 1 pagination soup = self.get_soup(self.novel_url) possible_title = soup.select_one("h1.subj") + if possible_title is None: + possible_title = soup.select_one("h3.subj") self.novel_title = possible_title.text.strip() logger.info("Novel title: %s", self.novel_title)