diff --git a/gallery_dl/extractor/nijie.py b/gallery_dl/extractor/nijie.py index 08c6c174..4c48d738 100644 --- a/gallery_dl/extractor/nijie.py +++ b/gallery_dl/extractor/nijie.py @@ -121,7 +121,7 @@ class NijieUserExtractor(NijieExtractor): r"/members(?:_illust)?\.php\?id=(\d+)") test = ( ("https://nijie.info/members_illust.php?id=44", { - "url": "4725cf3cd9cff4715db3c7e04dd7c323b9f2dec5", + "url": "66c4ff94c6e77c0765dd88f2d8c663055fda573e", "keyword": "d629c69e3172db1d7e026145e8eb640ac31ac16a", }), ("https://nijie.info/members_illust.php?id=43", { @@ -169,7 +169,7 @@ class NijieImageExtractor(NijieExtractor): r"/view(?:_popup)?\.php\?id=(\d+)") test = ( ("https://nijie.info/view.php?id=70720", { - "url": "c1881afd89b79af3d166545de15bab4d1e32c340", + "url": "5497f897311397dafa188521258624346a0af2a3", "keyword": "408393d010307c76d52cbd0a4368d6d357805aea", "content": "d85e3ea896ed5e4da0bca2390ad310a4df716ca6", }), diff --git a/gallery_dl/extractor/simplyhentai.py b/gallery_dl/extractor/simplyhentai.py index 44dc6fe8..5ad372d3 100644 --- a/gallery_dl/extractor/simplyhentai.py +++ b/gallery_dl/extractor/simplyhentai.py @@ -23,7 +23,7 @@ class SimplyhentaiGalleryExtractor(GalleryExtractor): (("https://original-work.simply-hentai.com" "/amazon-no-hiyaku-amazon-elixir"), { "url": "258289249990502c3138719cb89e995a60861e49", - "keyword": "18ab9defca53dbb2aeb7965193e93e0ea125b76b", + "keyword": "eba83ccdbab3022a2280c77aa747f9458196138b", }), ("https://www.simply-hentai.com/notfound", { "exception": exception.GalleryDLException, @@ -40,30 +40,26 @@ class SimplyhentaiGalleryExtractor(GalleryExtractor): self.session.headers["Referer"] = url def metadata(self, page): - extr = text.extract - title , pos = extr(page, 'Series', '', pos) - lang , pos = extr(page, 'box-title">Language', '', pos) - chars , pos = extr(page, 'box-title">Characters', '', pos) - tags , pos = extr(page, 'box-title">Tags', '', pos) - artist, pos = extr(page, 'box-title">Artists', '', pos) - date , pos = extr(page, 'Uploaded', '', pos) - lang = text.remove_html(lang) if lang else None - - return { - "gallery_id": text.parse_int(gid), + data = { "title" : text.unescape(title), - "artist" : text.split_html(artist), - "parody" : text.split_html(series), - "characters": text.split_html(chars), - "tags" : text.split_html(tags), - "lang" : util.language_to_code(lang), - "language" : lang, - "date" : text.remove_html(date), + "gallery_id": text.parse_int(extr('/Album/', '/')), + "parody" : split(extr('box-title">Series', '')), + "language" : text.remove_html(extr( + 'box-title">Language', '')) or None, + "characters": split(extr('box-title">Characters', '')), + "tags" : split(extr('box-title">Tags', '')), + "artist" : split(extr('box-title">Artists', '')), + "date" : text.parse_datetime(text.remove_html( + extr('Uploaded', '')), "%d.%m.%Y"), } + data["lang"] = util.language_to_code(data["language"]) + return data def images(self, _): url = self.chapter_url + "/all-pages" @@ -102,12 +98,11 @@ class SimplyhentaiImageExtractor(Extractor): self.type = match.group(2) def items(self): - page = self.request(self.page_url).text - url_search = 'data-src="' if self.type == "image" else '