From f361cb13e0afbd699294acc8c871565410a4f01b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mike=20F=C3=A4hrmann?= Date: Sun, 26 Feb 2017 02:25:36 +0100 Subject: [PATCH] [hentai2read] fix extraction --- gallery_dl/extractor/hentai2read.py | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/gallery_dl/extractor/hentai2read.py b/gallery_dl/extractor/hentai2read.py index 06800558..458519e5 100644 --- a/gallery_dl/extractor/hentai2read.py +++ b/gallery_dl/extractor/hentai2read.py @@ -11,6 +11,7 @@ from .. import text from . import hentaicdn import re +import json class Hentai2readMangaExtractor(hentaicdn.HentaicdnMangaExtractor): @@ -49,9 +50,9 @@ class Hentai2readChapterExtractor(hentaicdn.HentaicdnChapterExtractor): def __init__(self, match): hentaicdn.HentaicdnChapterExtractor.__init__(self) - self.url_title, self.chapter = match.groups() + url_title, self.chapter = match.groups() self.url = "http://hentai2read.com/{}/{}/".format( - self.url_title, self.chapter + url_title, self.chapter ) def get_job_metadata(self, page, images): @@ -66,3 +67,9 @@ class Hentai2readChapterExtractor(hentaicdn.HentaicdnChapterExtractor): "lang": "en", "language": "English", } + + @staticmethod + def get_image_urls(page): + """Extract and return a list of all image-urls""" + images = text.extract(page, "'images' : ", ",\n")[0] + return json.loads(images)