[cyberfile] add support (#5015)

This commit is contained in:
Mike Fährmann
2025-09-09 21:47:43 +02:00
parent 977e1bece3
commit 8617c08c6c
7 changed files with 247 additions and 0 deletions

View File

@@ -2036,6 +2036,20 @@ Description
uses the same domain as a given input URL.
extractor.cyberfile.password
----------------------------
Type
``string``
Default
``""``
Description
Password value used to access protected files and folders.
Note: Leave this value empty or undefined
to be interactively prompted for a password when needed
(see `getpass() <https://docs.python.org/3/library/getpass.html#getpass.getpass>`__).
extractor.[Danbooru].external
-----------------------------
Type

View File

@@ -237,6 +237,10 @@
{
"domain": null
},
"cyberfile":
{
"password": ""
},
"dankefuerslesen":
{
"zip": false

View File

@@ -211,6 +211,12 @@ Consider all listed sites to potentially be NSFW.
<td>Albums, Media Files</td>
<td></td>
</tr>
<tr id="cyberfile" title="cyberfile">
<td>CyberFile</td>
<td>https://cyberfile.me/</td>
<td>Files, Folders</td>
<td></td>
</tr>
<tr id="dankefuerslesen" title="dankefuerslesen">
<td>Danke fürs Lesen</td>
<td>https://danke.moe/</td>

View File

@@ -44,6 +44,7 @@ modules = [
"comick",
"comicvine",
"cyberdrop",
"cyberfile",
"danbooru",
"dankefuerslesen",
"desktopography",

View File

@@ -0,0 +1,114 @@
# -*- coding: utf-8 -*-
# Copyright 2025 Mike Fährmann
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.
"""Extractors for https://cyberfile.me/"""
from .common import Extractor, Message
from .. import text, exception
BASE_PATTERN = r"(?:https?://)?(?:www\.)?cyberfile\.me"
class CyberfileExtractor(Extractor):
"""Base class for cyberfile extractors"""
category = "cyberfile"
root = "https://cyberfile.me"
def request_api(self, endpoint, data):
url = f"{self.root}{endpoint}"
headers = {
"X-Requested-With": "XMLHttpRequest",
"Origin": self.root,
}
resp = self.request_json(
url, method="POST", headers=headers, data=data)
if "albumPasswordModel" in resp.get("javascript", ""):
url_pw = f"{self.root}/ajax/folder_password_process"
data_pw = {
"folderPassword": self._get_auth_info(password=True)[1],
"folderId": text.extr(
resp["html"], '<input type="hidden" value="', '"'),
"submitme": "1",
}
resp = self.request_json(
url_pw, method="POST", headers=headers, data=data_pw)
if not resp.get("success"):
raise exception.AuthorizationError(f"'{resp.get('msg')}'")
resp = self.request_json(
url, method="POST", headers=headers, data=data)
return resp
class CyberfileFolderExtractor(CyberfileExtractor):
subcategory = "folder"
pattern = rf"{BASE_PATTERN}/folder/([0-9a-f]+)"
example = "https://cyberfile.me/folder/0123456789abcdef/NAME"
def items(self):
folder_hash = self.groups[0]
url = f"{self.root}/folder/{folder_hash}"
folder_num = text.extr(self.request(url).text, "ages('folder', '", "'")
data = {
"pageType" : "folder",
"nodeId" : folder_num,
"pageStart": "1",
"perPage" : "0",
"filterOrderBy": "",
}
resp = self.request_api("/account/ajax/load_files", data)
folder = {
"_extractor" : CyberfileFileExtractor,
"folder_hash": folder_hash,
"folder_num" : text.parse_int(folder_num),
"folder" : resp["page_title"],
}
for url in text.extract_iter(resp["html"], 'dtfullurl="', '"'):
yield Message.Queue, url, folder
class CyberfileFileExtractor(CyberfileExtractor):
subcategory = "file"
directory_fmt = ("{category}", "{uploader}", "{folder}")
pattern = rf"{BASE_PATTERN}/([a-zA-Z0-9]+)"
example = "https://cyberfile.me/AbCdE"
def items(self):
file_id = self.groups[0]
url = f"{self.root}/{file_id}"
file_num = text.extr(self.request(url).text, "owFileInformation(", ")")
data = {"u": file_num}
resp = self.request_api("/account/ajax/file_details", data)
extr = text.extract_from(resp["html"])
info = text.split_html(extr('class="text-section">', "</span>"))
folder = info[0] if len(info) > 1 else ""
file = {
"file_id" : file_id,
"file_num": text.parse_int(file_num),
"name" : resp["page_title"],
"folder" : folder,
"uploader": info[-1][2:].strip(),
"size" : text.parse_bytes(text.remove_html(extr(
"Filesize:", "</tr>"))[:-1]),
"tags" : text.split_html(extr(
"Keywords:", "</tr>")),
"date" : text.parse_datetime(text.remove_html(extr(
"Uploaded:", "</tr>")), "%d/%m/%Y %H:%M:%S"),
"permissions": text.remove_html(extr(
"Permissions:", "</tr>")).split(" &amp; "),
}
file["file_url"] = url = extr("openUrl('", "'")
text.nameext_from_url(file["name"] or url, file)
yield Message.Directory, file
yield Message.Url, url, file

View File

@@ -42,6 +42,7 @@ CATEGORY_MAP = {
"cien" : "Ci-en",
"cohost" : "cohost!",
"comicvine" : "Comic Vine",
"cyberfile" : "CyberFile",
"dankefuerslesen": "Danke fürs Lesen",
"deviantart" : "DeviantArt",
"drawfriends" : "Draw Friends",

107
test/results/cyberfile.py Normal file
View File

@@ -0,0 +1,107 @@
# -*- coding: utf-8 -*-
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.
from gallery_dl.extractor import cyberfile
from gallery_dl import exception
__tests__ = (
{
"#url" : "https://cyberfile.me/bpfD",
"#class" : cyberfile.CyberfileFileExtractor,
"#pattern" : r"https://p1.cyberfile.me/bpfD/Raindrops.mp4\?download_token=[0-9a-f]{64}",
"#count" : 1,
"date" : "dt:2024-01-04 16:01:26",
"extension" : "mp4",
"file_id" : "bpfD",
"file_num" : 718677,
"file_url" : str,
"filename" : "Raindrops",
"folder" : "Videos",
"name" : "Raindrops.mp4",
"size" : 3659530,
"uploader" : "barbarella",
"permissions": [
"View",
"Download",
],
"tags" : [
"raindrops",
"mp4",
],
},
{
"#url" : "https://cyberfile.me/7d79",
"#comment" : "password-protected",
"#class" : cyberfile.CyberfileFileExtractor,
"#options" : {"password": "sample_pwd"},
"#pattern" : r"https://p1.cyberfile.me/7d79/Raindrops.mp4\?download_token=[0-9a-f]{64}",
"#count" : 1,
"date" : "dt:2024-01-04 17:50:59",
"extension" : "mp4",
"file_id" : "7d79",
"file_num" : 718711,
"file_url" : str,
"filename" : "Raindrops",
"folder" : "Playlist Protected",
"name" : "Raindrops.mp4",
"size" : 3659530,
"tags" : [],
"uploader" : "barbarella",
"permissions": [
"View",
"Download",
],
},
{
"#url" : "https://cyberfile.me/7d79",
"#comment" : "password-protected",
"#class" : cyberfile.CyberfileFileExtractor,
"#options" : {"password": "abc"},
"#exception": exception.AuthorizationError,
},
{
"#url" : "https://cyberfile.me/folder/82d0aab0853fdd13294171577081f4d8/Playlist",
"#class" : cyberfile.CyberfileFolderExtractor,
"#results" : (
"https://cyberfile.me/7d76",
"https://cyberfile.me/7d77",
),
"folder" : "Playlist",
"folder_hash": "82d0aab0853fdd13294171577081f4d8",
"folder_num" : 56050,
},
{
"#url" : "https://cyberfile.me/folder/1524a09fa9d773dcc88c841ed2e098c9/Playlist_Protected",
"#comment" : "password-protected",
"#class" : cyberfile.CyberfileFolderExtractor,
"#options" : {"password": "sample_pwd"},
"#results" : (
"https://cyberfile.me/7d7a",
"https://cyberfile.me/7d79",
),
"folder" : "Playlist Protected",
"folder_hash": "1524a09fa9d773dcc88c841ed2e098c9",
"folder_num" : 56051,
},
{
"#url" : "https://cyberfile.me/folder/1524a09fa9d773dcc88c841ed2e098c9/Playlist_Protected",
"#comment" : "password-protected",
"#class" : cyberfile.CyberfileFolderExtractor,
"#options" : {"password": "abc"},
"#exception": exception.AuthorizationError,
},
)