68 lines
2.3 KiB
Python
68 lines
2.3 KiB
Python
# -*- coding: utf-8 -*-
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License version 2 as
|
|
# published by the Free Software Foundation.
|
|
|
|
"""Extractors for https://www.wikifeet.com/"""
|
|
|
|
from .common import GalleryExtractor
|
|
from .. import text, util
|
|
|
|
|
|
class WikifeetGalleryExtractor(GalleryExtractor):
|
|
"""Extractor for image galleries from wikifeet.com"""
|
|
category = "wikifeet"
|
|
directory_fmt = ("{category}", "{celebrity}")
|
|
filename_fmt = "{category}_{celeb}_{pid}.{extension}"
|
|
archive_fmt = "{type}_{celeb}_{pid}"
|
|
pattern = (r"(?:https?://)(?:(?:www\.)?wikifeetx?|"
|
|
r"men\.wikifeet)\.com/([^/?#]+)")
|
|
example = "https://www.wikifeet.com/CELEB"
|
|
|
|
def __init__(self, match):
|
|
self.root = text.root_from_url(match[0])
|
|
if "wikifeetx.com" in self.root:
|
|
self.category = "wikifeetx"
|
|
self.type = "men" if "://men." in self.root else "women"
|
|
self.celeb = match[1]
|
|
GalleryExtractor.__init__(self, match, self.root + "/" + self.celeb)
|
|
|
|
def metadata(self, page):
|
|
extr = text.extract_from(page)
|
|
return {
|
|
"celeb" : self.celeb,
|
|
"type" : self.type,
|
|
"birthplace": text.unescape(extr('"bplace":"', '"')),
|
|
"birthday" : self.parse_datetime_iso(text.unescape(extr(
|
|
'"bdate":"', '"'))[:10]),
|
|
"shoesize" : text.unescape(extr('"ssize":', ',')),
|
|
"rating" : text.parse_float(extr('"score":', ',')),
|
|
"celebrity" : text.unescape(extr('"cname":"', '"')),
|
|
}
|
|
|
|
def images(self, page):
|
|
tagmap = {
|
|
"C": "Close-up",
|
|
"T": "Toenails",
|
|
"N": "Nylons",
|
|
"A": "Arches",
|
|
"S": "Soles",
|
|
"B": "Barefoot",
|
|
}
|
|
|
|
gallery = text.extr(page, '"gallery":[', '],')
|
|
base = f"https://pics.wikifeet.com/{self.celeb}-Feet-"
|
|
return [
|
|
(f"{base}{data['pid']}.jpg", {
|
|
"pid" : data["pid"],
|
|
"width" : data["pw"],
|
|
"height": data["ph"],
|
|
"tags" : [
|
|
tagmap[tag]
|
|
for tag in data["tags"] if tag in tagmap
|
|
],
|
|
})
|
|
for data in util.json_loads(f"[{gallery}]")
|
|
]
|