From 1ca6be86190c661a63583170c31453e6e368ec1d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Mike=20F=C3=A4hrmann?= Date: Mon, 10 Oct 2022 16:05:46 +0200 Subject: [PATCH] [fanbox] add 'content' metadata field (#3020) --- gallery_dl/extractor/fanbox.py | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) diff --git a/gallery_dl/extractor/fanbox.py b/gallery_dl/extractor/fanbox.py index 84812480..013eb36c 100644 --- a/gallery_dl/extractor/fanbox.py +++ b/gallery_dl/extractor/fanbox.py @@ -68,6 +68,16 @@ class FanboxExtractor(Extractor): post["html"] = content_body["html"] if post["type"] == "article": post["articleBody"] = content_body.copy() + if "blocks" in content_body: + content = [] + append = content.append + for block in content_body["blocks"]: + if "text" in block: + append(block["text"]) + if "links" in block: + for link in block["links"]: + append(link["url"]) + post["content"] = "\n".join(content) post["date"] = text.parse_datetime(post["publishedDatetime"]) post["text"] = content_body.get("text") if content_body else None @@ -271,6 +281,16 @@ class FanboxPostExtractor(FanboxExtractor): "hasAdultContent": True }, }), + # 'content' metadata (#3020) + ("https://www.fanbox.cc/@official-en/posts/4326303", { + "keyword": { + "content": r"re:^Greetings from FANBOX.\n \n" + r"As of Monday, September 5th, 2022, we are happy " + r"to announce the start of the FANBOX hashtag " + r"event #MySetupTour ! \nAbout the event\n" + r"To join this event ...", + }, + }), ) def __init__(self, match):