Skip to content

Commit

Permalink
[mangakakalot] update URL patterns, fix flake8 errors (#876)
Browse files Browse the repository at this point in the history
  • Loading branch information
mikf committed Jul 13, 2020
1 parent 7dfdcc3 commit 9cd1bc6
Showing 1 changed file with 17 additions and 6 deletions.
23 changes: 17 additions & 6 deletions gallery_dl/extractor/mangakakalot.py
Original file line number Diff line number Diff line change
Expand Up @@ -30,8 +30,13 @@ def parse_page(page, data):

class MangakakalotChapterExtractor(MangakakalotBase, ChapterExtractor):
"""Extractor for manga-chapters from mangakakalot.com"""
archive_fmt = "{manga}_{chapter}_{page}"
pattern = r"(?:https?://)?mangakakalot\.com(/chapter/([a-z]+\d+)/chapter_([0-9.]+))"
pattern = (r"(?:https?://)?(?:www\.)?mangakakalot\.com"
r"(/chapter/(\w+)/chapter_([^/?&#]+))")
test = (
("https://mangakakalot.com/chapter/rx922077/chapter_6"),
("https://mangakakalot.com/chapter"
"/hatarakanai_futari_the_jobless_siblings/chapter_20.1"),
)

def __init__(self, match):
self.path, self.url_title, self.chapter = match.groups()
Expand All @@ -51,9 +56,11 @@ def metadata(self, chapter_page):
})
pos = page.index('href="' + churl + '"')
data["title"] , pos = text.extract(page, '>', '<', pos)
x = chpage.index('\n', chpage.index('<img', chpage.index('<div class="vung-doc"')))
x = chpage.index('\n', chpage.index(
'<img', chpage.index('<div class="vung-doc"')))
y = chpage.rfind('<img', 0, x)
data["count"] = text.parse_int(text.extract(chpage[y:x], 'page ', ' - Mangakakalot.com"')[0])
data["count"] = text.parse_int(text.extract(
chpage[y:x], 'page ', ' - Mangakakalot.com"')[0])
data["date"] , pos = text.extract(page, 'title="', '">', pos)
return data

Expand All @@ -74,8 +81,12 @@ def images(self, page):
class MangakakalotMangaExtractor(MangakakalotBase, MangaExtractor):
"""Extractor for manga from mangakakalot.com"""
chapterclass = MangakakalotChapterExtractor
reverse = False
pattern = r"(?:https?://)?mangakakalot\.com(/manga/([a-z]+\d+))"
pattern = (r"(?:https?://)?(?:www\.)?mangakakalot\.com"
r"(/(?:manga/|read-)\w+)")
test = (
("https://mangakakalot.com/manga/rx922077"),
("https://mangakakalot.com/read-ry3sw158504884246"),
)

def chapters(self, page):
results = []
Expand Down

0 comments on commit 9cd1bc6

Please sign in to comment.