[imagehost] improve 'filename' & 'extension' handling

This commit is contained in:
Mike Fährmann
2025-11-04 17:00:37 +01:00
parent 7ed04d830e
commit e604c22812
2 changed files with 12 additions and 5 deletions

View File

@@ -58,8 +58,16 @@ class ImagehostImageExtractor(Extractor):
url, filename = self.get_info(page)
if not url:
return
- data = text.nameext_from_url(filename, {"token": self.token})
+ if filename:
+     data = text.nameext_from_name(filename)
+     if not data["extension"]:
+         data["extension"] = text.ext_from_url(url)
+ else:
+     data = text.nameext_from_url(url)
+ data["token"] = self.token
data.update(self.metadata(page))
if self._https and url.startswith("http:"):
url = "https:" + url[5:]
if self._validate is not None:
@@ -341,7 +349,7 @@ class TurboimagehostImageExtractor(ImagehostImageExtractor):
def get_info(self, page):
url = text.extract(page, 'src="', '"', page.index("<img "))[0]
- return url, url
+ return url, None
class TurboimagehostGalleryExtractor(ImagehostImageExtractor):
@@ -380,7 +388,7 @@ class ViprImageExtractor(ImagehostImageExtractor):
def get_info(self, page):
url = text.extr(page, '<img src="', '"')
- return url, url
+ return url, None
class ImgclickImageExtractor(ImagehostImageExtractor):