[eporner] add support (#8581)

* [eporner] Add support * Line-length <80 chars * Fix flake8 indentation * update - generalize example URL - strip "Photo Gallery" from 'title' - extract 'id' * update supportedsites * update test results
2025-11-20 22:03:54 +05:00
parent 2bff6828e1
commit d74809c538
5 changed files with 106 additions and 0 deletions
--- a/gallery_dl/extractor/init.py
+++ b/gallery_dl/extractor/init.py
@@ -56,6 +56,7 @@ modules = [
    "discord",
    "dynastyscans",
    "e621",
+    "eporner",
    "erome",
    "everia",
    "exhentai",
--- a/gallery_dl/extractor/eporner.py
+++ b/gallery_dl/extractor/eporner.py
@@ -0,0 +1,54 @@
+# -*- coding: utf-8 -*-
+
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Extractors for https://www.eporner.com/"""
+
+from .common import GalleryExtractor
+from .. import text
+
+
+class EpornerGalleryExtractor(GalleryExtractor):
+    """Extractor for image galleries from eporner.com"""
+    category = "eporner"
+    root = "https://eporner.com"
+    pattern = (r"(?:https?://)?(?:www\.)?eporner\.com"
+               r"/gallery/(\w+)(?:/([\w-]+))?")
+    example = "https://www.eporner.com/gallery/GID/SLUG/"
+
+    def __init__(self, match):
+        url = f"{self.root}/gallery/{match[1]}/{match[2]}/"
+        GalleryExtractor.__init__(self, match, url)
+
+    def metadata(self, page):
+        title = text.extr(page, "<title>", " - EPORNER</title>")
+        if title.endswith(" Photo Gallery"):
+            title = title[:-14]
+
+        return {
+            "gallery_id": self.groups[0],
+            "title"     : text.unescape(title),
+            "slug"      : text.extr(
+                page, "/gallery/", '/"').rpartition("/")[2],
+            "description": text.unescape(text.extr(
+                page, 'name="description" content="', '"')),
+            "tags": text.extr(
+                page, 'EP.ads.keywords = "', '"').split(","),
+        }
+
+    def images(self, page):
+        album = text.extr(
+            page, 'class="photosgrid gallerygrid"', "id='gallerySlideBox'")
+
+        results = []
+        for url in text.extract_iter(album, ' src="', '"'):
+            url, _, ext = url.rpartition(".")
+            # Preview images have a resolution suffix.
+            # E.g. "11208293-image-3_296x1000.jpg".
+            # The same name, but without the suffix, leads to the full image.
+            url = url[:url.rfind("_")]
+            name = url[url.rfind("/")+1:]
+            results.append((f"{url}.{ext}", {"id": name[:name.find("-")]}))
+        return results