[batoto] add 'domain' option (#7174)

allow legacy domains by default
This commit is contained in:
Mike Fährmann
2025-03-14 09:10:58 +01:00
parent f395a3ec79
commit 22d46f2462
4 changed files with 52 additions and 12 deletions

View File

@@ -54,11 +54,23 @@ class BatotoBase():
"""Base class for batoto extractors"""
category = "batoto"
root = "https://xbato.org"
_warn_legacy = True
def _init_root(self, match):
domain = match.group(1)
if domain not in LEGACY_DOMAINS:
self.root = "https://" + domain
def _init_root(self):
domain = self.config("domain")
if domain is None or domain in {"auto", "url"}:
domain = self.groups[0]
if domain in LEGACY_DOMAINS:
if self._warn_legacy:
BatotoBase._warn_legacy = False
self.log.warning("Legacy domain '%s'", domain)
elif domain == "nolegacy":
domain = self.groups[0]
if domain in LEGACY_DOMAINS:
domain = "xbato.org"
elif domain == "nowarn":
domain = self.groups[0]
self.root = "https://" + domain
def request(self, url, **kwargs):
kwargs["encoding"] = "utf-8"
@@ -72,10 +84,10 @@ class BatotoChapterExtractor(BatotoBase, ChapterExtractor):
example = "https://xbato.org/title/12345-MANGA/54321"
def __init__(self, match):
self._init_root(match)
self.chapter_id = match.group(2)
url = "{}/title/0/{}".format(self.root, self.chapter_id)
ChapterExtractor.__init__(self, match, url)
ChapterExtractor.__init__(self, match, False)
self._init_root()
self.chapter_id = self.groups[1]
self.gallery_url = "{}/title/0/{}".format(self.root, self.chapter_id)
def metadata(self, page):
extr = text.extract_from(page)
@@ -133,10 +145,10 @@ class BatotoMangaExtractor(BatotoBase, MangaExtractor):
example = "https://xbato.org/title/12345-MANGA/"
def __init__(self, match):
self._init_root(match)
self.manga_id = match.group(2) or match.group(3)
url = "{}/title/{}".format(self.root, self.manga_id)
MangaExtractor.__init__(self, match, url)
MangaExtractor.__init__(self, match, False)
self._init_root()
self.manga_id = self.groups[1] or self.groups[2]
self.manga_url = "{}/title/{}".format(self.root, self.manga_id)
def chapters(self, page):
extr = text.extract_from(page)