diff --git a/gallery_dl/extractor/nijie.py b/gallery_dl/extractor/nijie.py
index 08c6c174..4c48d738 100644
--- a/gallery_dl/extractor/nijie.py
+++ b/gallery_dl/extractor/nijie.py
@@ -121,7 +121,7 @@ class NijieUserExtractor(NijieExtractor):
r"/members(?:_illust)?\.php\?id=(\d+)")
test = (
("https://nijie.info/members_illust.php?id=44", {
- "url": "4725cf3cd9cff4715db3c7e04dd7c323b9f2dec5",
+ "url": "66c4ff94c6e77c0765dd88f2d8c663055fda573e",
"keyword": "d629c69e3172db1d7e026145e8eb640ac31ac16a",
}),
("https://nijie.info/members_illust.php?id=43", {
@@ -169,7 +169,7 @@ class NijieImageExtractor(NijieExtractor):
r"/view(?:_popup)?\.php\?id=(\d+)")
test = (
("https://nijie.info/view.php?id=70720", {
- "url": "c1881afd89b79af3d166545de15bab4d1e32c340",
+ "url": "5497f897311397dafa188521258624346a0af2a3",
"keyword": "408393d010307c76d52cbd0a4368d6d357805aea",
"content": "d85e3ea896ed5e4da0bca2390ad310a4df716ca6",
}),
diff --git a/gallery_dl/extractor/simplyhentai.py b/gallery_dl/extractor/simplyhentai.py
index 44dc6fe8..5ad372d3 100644
--- a/gallery_dl/extractor/simplyhentai.py
+++ b/gallery_dl/extractor/simplyhentai.py
@@ -23,7 +23,7 @@ class SimplyhentaiGalleryExtractor(GalleryExtractor):
(("https://original-work.simply-hentai.com"
"/amazon-no-hiyaku-amazon-elixir"), {
"url": "258289249990502c3138719cb89e995a60861e49",
- "keyword": "18ab9defca53dbb2aeb7965193e93e0ea125b76b",
+ "keyword": "eba83ccdbab3022a2280c77aa747f9458196138b",
}),
("https://www.simply-hentai.com/notfound", {
"exception": exception.GalleryDLException,
@@ -40,30 +40,26 @@ class SimplyhentaiGalleryExtractor(GalleryExtractor):
self.session.headers["Referer"] = url
def metadata(self, page):
- extr = text.extract
- title , pos = extr(page, 'Series', '', pos)
- lang , pos = extr(page, 'box-title">Language', '', pos)
- chars , pos = extr(page, 'box-title">Characters', '', pos)
- tags , pos = extr(page, 'box-title">Tags', '', pos)
- artist, pos = extr(page, 'box-title">Artists', '', pos)
- date , pos = extr(page, 'Uploaded', '', pos)
- lang = text.remove_html(lang) if lang else None
-
- return {
- "gallery_id": text.parse_int(gid),
+ data = {
"title" : text.unescape(title),
- "artist" : text.split_html(artist),
- "parody" : text.split_html(series),
- "characters": text.split_html(chars),
- "tags" : text.split_html(tags),
- "lang" : util.language_to_code(lang),
- "language" : lang,
- "date" : text.remove_html(date),
+ "gallery_id": text.parse_int(extr('/Album/', '/')),
+ "parody" : split(extr('box-title">Series', '')),
+ "language" : text.remove_html(extr(
+ 'box-title">Language', '')) or None,
+ "characters": split(extr('box-title">Characters', '')),
+ "tags" : split(extr('box-title">Tags', '')),
+ "artist" : split(extr('box-title">Artists', '')),
+ "date" : text.parse_datetime(text.remove_html(
+ extr('Uploaded', '')), "%d.%m.%Y"),
}
+ data["lang"] = util.language_to_code(data["language"])
+ return data
def images(self, _):
url = self.chapter_url + "/all-pages"
@@ -102,12 +98,11 @@ class SimplyhentaiImageExtractor(Extractor):
self.type = match.group(2)
def items(self):
- page = self.request(self.page_url).text
- url_search = 'data-src="' if self.type == "image" else '