add bilibili User Articles FavList support

- fix whitespace
- fix extractor names
- Add favlist url user check
- apply changes
- add test
- update docs/supportedsites
This commit is contained in:
mmmpipi
2025-01-06 15:35:49 +08:00
committed by Mike Fährmann
parent 18ed39c1cf
commit e4cc3419c5
4 changed files with 54 additions and 1 deletions

View File

@@ -136,7 +136,7 @@ Consider all listed sites to potentially be NSFW.
<tr>
<td>Bilibili</td>
<td>https://www.bilibili.com/</td>
<td>Articles, User Articles</td>
<td>Articles, User Articles, User Article Favorites</td>
<td></td>
</tr>
<tr>

View File

@@ -81,6 +81,27 @@ class BilibiliArticleExtractor(BilibiliExtractor):
yield Message.Url, url, text.nameext_from_url(url, article)
class BilibiliUserArticlesFavoriteExtractor(BilibiliExtractor):
    """Extractor for bilibili user article favorites"""
    subcategory = "user-articles-favorite"
    pattern = r"(?:https?://)?space\.bilibili\.com/(\d+)/favlist\?fid=opus"
    example = "https://space.bilibili.com/12345/favlist?fid=opus"
    # class-level flag; set to False once the cookie check has run
    _warning = True

    def _init(self):
        """Run the base initialization, then check once for 'SESSDATA'"""
        BilibiliExtractor._init(self)

        if not self._warning:
            return

        has_session = self.cookies_check(("SESSDATA",))
        if not has_session:
            self.log.error("'SESSDATA' cookie required")
        # stored on the class, so later instances skip the check
        BilibiliUserArticlesFavoriteExtractor._warning = False

    def items(self):
        """Yield one Queue message per entry returned by user_favlist()"""
        for fav in self.api.user_favlist():
            # hand each queued URL over to the single-article extractor
            fav["_extractor"] = BilibiliArticleExtractor
            opus_url = "{}/opus/{}".format(self.root, fav["opus_id"])
            yield Message.Queue, opus_url, fav
class BilibiliAPI():
def __init__(self, extractor):
    """Keep a reference to the extractor this API object is created for"""
    self.extractor = extractor
@@ -122,3 +143,28 @@ class BilibiliAPI():
raise exception.StopExtraction(
"%s: Unable to extract INITIAL_STATE data", article_id)
self.extractor.wait(seconds=300)
def user_favlist(self):
    """Yield all items of the '/opus/feed/fav' endpoint, page by page

    Starts at page 1 with a page size of 20 and keeps requesting the
    next page for as long as the response reports a truthy 'has_more'.
    """
    query = {"page": 1, "page_size": 20}

    while True:
        feed = self._call("/opus/feed/fav", query)["data"]
        yield from feed["items"]

        if feed.get("has_more"):
            query["page"] += 1
        else:
            return
def login_user_id(self):
    """Return the 'mid' value from the 'myinfo' API response

    Requests the endpoint through the extractor and reads
    data -> profile -> mid from the JSON body (presumably the ID of
    the account the session cookies belong to -- confirm with caller).

    Raises exception.StopExtraction when the response 'code' is not 0
    or when the response does not contain the expected profile data.
    """
    url = "https://api.bilibili.com/x/space/v2/myinfo"
    data = self.extractor.request(url).json()

    if data["code"] != 0:
        self.extractor.log.debug("Server response: %s", data)
        raise exception.StopExtraction(
            "API request failed. Are you logged in?")

    try:
        return data["data"]["profile"]["mid"]
    except (KeyError, TypeError) as exc:
        # a missing key or a null / non-dict level in the response
        raise exception.StopExtraction("API request failed") from exc

View File

@@ -206,6 +206,7 @@ SUBCATEGORY_MAP = {
},
"bilibili": {
"user-articles": "User Articles",
"user-articles-favorite": "User Article Favorites",
},
"bluesky": {
"posts": "",

View File

@@ -65,4 +65,10 @@ __tests__ = (
"#class" : bilibili.BilibiliUserArticlesExtractor,
},
{
"#url" : "https://space.bilibili.com/405279279/favlist?fid=opus",
"#class" : bilibili.BilibiliUserArticlesFavoriteExtractor,
"#auth" : True,
},
)