From 4a60f6068a2dd4454384c0f2536c00326a1dacc3 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mike=20F=C3=A4hrmann?= Date: Thu, 20 Jul 2017 16:02:09 +0200 Subject: [PATCH] [mangazuki] add manga extractor --- docs/supportedsites.rst | 2 +- gallery_dl/extractor/mangazuki.py | 26 +++++++++++++++++++++++++- 2 files changed, 26 insertions(+), 2 deletions(-) diff --git a/docs/supportedsites.rst b/docs/supportedsites.rst index 2d5af076..0f6b5392 100644 --- a/docs/supportedsites.rst +++ b/docs/supportedsites.rst @@ -49,7 +49,7 @@ Manga Stream https://mangastream.com/ Chapters Mangapanda http://www.mangapanda.com/ Chapters, Manga MangaPark http://mangapark.me/ Chapters, Manga Mangareader http://www.mangareader.net/ Chapters, Manga -Mangazuki https://mangazuki.co/ Chapters +Mangazuki https://mangazuki.co/ Chapters, Manga nhentai https://nhentai.net/ Galleries Niconico Seiga http://seiga.nicovideo.jp Images from Users, individual Images Required nijie https://nijie.info/ Images from Users, individual Images Required diff --git a/gallery_dl/extractor/mangazuki.py b/gallery_dl/extractor/mangazuki.py index 3eecfcc5..529576f3 100644 --- a/gallery_dl/extractor/mangazuki.py +++ b/gallery_dl/extractor/mangazuki.py @@ -8,7 +8,7 @@ """Extract manga-chapters and entire manga from https://mangazuki.co/""" -from .common import Extractor, Message +from .common import Extractor, MangaExtractor, Message from .. import text, exception @@ -58,3 +58,27 @@ class MangazukiChapterExtractor(Extractor): def get_images(page): """Return a list of all image-urls""" return list(text.extract_iter(page, 'data-src="', '"')) + + +class MangazukiMangaExtractor(MangaExtractor): + """Extractor for manga from mangazuki.co""" + category = "mangazuki" + pattern = [r"(?:https?://)?(?:www\.)?(mangazuki\.co/series/[^/?&#]+)"] + scheme = "https" + test = [("https://mangazuki.co/series/Double-Casting", { + "url": "aab747414191b14e768f4a1eb148448d83ef2e14", + })] + + def chapters(self, page): + params = {"page": 1} + chlist = [] + + while True: + chlist.extend( + text.extract_iter(page, '