[imgdrive] add 'image' extractor (#7976)
This commit is contained in:
@@ -396,3 +396,17 @@ class PicstateImageExtractor(ImagehostImageExtractor):
|
||||
url , pos = text.extract(page, '<img src="', '"', pos)
|
||||
filename, pos = text.extract(page, 'alt="', '"', pos)
|
||||
return url, filename
|
||||
|
||||
|
||||
class ImgdriveImageExtractor(ImagehostImageExtractor):
    """Extractor for single images from imgdrive.net"""
    category = "imgdrive"
    pattern = r"(?:https?://)?((?:www\.)?imgdrive\.net/img-(\w+)\.html)"
    example = "https://imgdrive.net/img-0123456789abc.html"

    def get_info(self, page):
        """Return an (image URL, name) pair read from the page's og: tags"""
        # The og:image lookup is handed the position returned by the
        # og:title lookup, so the two tags are looked up in that order.
        og_title, offset = text.extract(
            page, 'property="og:title" content="', '"')
        og_image, _ = text.extract(
            page, 'property="og:image" content="', '"', offset)

        # The advertised URL contains "/small/"; swap it for "/big/".
        # NOTE(review): presumably thumbnail vs. full-size image - confirm.
        image_url = og_image.replace("/small/", "/big/")

        # Split off at most two trailing " | "-separated parts of the title
        # and keep what precedes them.
        name = og_title.rsplit(" | ", 2)[0]
        return image_url, name
|
||||
|
||||
Reference in New Issue
Block a user