From 9dde853fc5163144cca9417a81c5fe54c905c6e6 Mon Sep 17 00:00:00 2001 From: NecRaul Date: Fri, 4 Jul 2025 03:17:20 +0400 Subject: [PATCH] [warosu] HTML attribute fix --- gallery_dl/extractor/warosu.py | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/gallery_dl/extractor/warosu.py b/gallery_dl/extractor/warosu.py index a80d4c41..e78fd949 100644 --- a/gallery_dl/extractor/warosu.py +++ b/gallery_dl/extractor/warosu.py @@ -50,7 +50,7 @@ class WarosuThreadExtractor(Extractor): def metadata(self, page): boardname = text.extr(page, "", "") - title = text.unescape(text.extr(page, 'class="filetitle">', "<")) + title = text.unescape(text.extr(page, "class=filetitle>", "<")) return { "board" : self.board, "board_name": boardname.split(" - ")[1], @@ -60,14 +60,14 @@ class WarosuThreadExtractor(Extractor): def posts(self, page): """Build a list of all post objects""" - page = text.extr(page, '
") + page = text.extr(page, "
") needle = "" return [self.parse(post) for post in page.split(needle)] def parse(self, post): """Build post object by extracting data from an HTML post""" data = self._extract_post(post) - if '' in post and \ + if '', "<").strip(), - "time": extr('class="posttime" title="', '000">'), + "no" : extr("id=p", ">"), + "name": extr("class=postername>", "<").strip(), + "time": extr("class=posttime title=", "000>"), "com" : text.unescape(text.remove_html(extr( "
", "
").strip())), } @@ -92,9 +92,9 @@ class WarosuThreadExtractor(Extractor): data["h"] = extr("", ", ") data["filename"] = text.unquote(extr( "", "<").rstrip().rpartition(".")[0]) - extr("
", "") + extr("
", "") - url = extr('') + url = extr("") if url: if url[0] == "/": data["image"] = self.root + url