[bellazon] use 'data-full-image' URLs if available (#8833)
This commit is contained in:
@@ -1,6 +1,6 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
# Copyright 2025 Mike Fährmann
|
||||
# Copyright 2025-2026 Mike Fährmann
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License version 2 as
|
||||
@@ -49,7 +49,11 @@ class BellazonExtractor(Extractor):
|
||||
yield Message.Directory, "", data
|
||||
data["num"] = data["num_internal"] = data["num_external"] = 0
|
||||
for info, url, url_img in urls:
|
||||
url = text.unescape(url or url_img)
|
||||
if url_img:
|
||||
url = text.unescape(
|
||||
text.extr(info, 'data-full-image="', '"') or url_img)
|
||||
else:
|
||||
url = text.unescape(url)
|
||||
|
||||
if url.startswith(native):
|
||||
if (
|
||||
|
||||
@@ -248,6 +248,28 @@ __tests__ = (
|
||||
"id" : r"re:^\d+$",
|
||||
},
|
||||
|
||||
{
|
||||
"#url" : "https://www.bellazon.com/main/topic/79152-sydney-sweeney/page/42/#comment-6113627",
|
||||
"#comment" : "'data-full-image' URLs (#8833)",
|
||||
"#class" : bellazon.BellazonPostExtractor,
|
||||
"#results" : (
|
||||
"https://www.wmagazine.com/culture/sydney-sweeney-cover-interview-the-housemaid-christy",
|
||||
"https://www.bellazon.com/main/uploads/monthly_2026_01/1222250126covershrinstagram2.jpg.9bca664c750694127c5c77c0e99db770.jpg",
|
||||
"https://www.bellazon.com/main/uploads/monthly_2026_01/1222250126covershrcms2.jpg.a4d33f2e157aec446f9e268cce576ddc.jpg",
|
||||
"https://www.bellazon.com/main/uploads/monthly_2026_01/1-0126broadsheetcmslo13-14.jpg.21f087b58d0d3cc5c7d03ea2bb62a979.jpg",
|
||||
),
|
||||
|
||||
"post" : {
|
||||
"author_id" : "145049",
|
||||
"author_slug": "matt",
|
||||
"author_url" : "https://www.bellazon.com/main/profile/145049-matt/",
|
||||
"content" : """<p style="text-align:center;">W Magazine's 2026 Best Performances issue</p><p style="text-align:center;">Sydney Sweeney Talks The Housemaid, Christy, and Bonding With Amanda Seyfried</p><p style="text-align:center;">Ph. Tyrone Lebon</p><p style="text-align:center;"><a rel="external nofollow" href="https://www.wmagazine.com/culture/sydney-sweeney-cover-interview-the-housemaid-christy">https://www.wmagazine.com/culture/sydney-sweeney-cover-interview-the-housemaid-christy</a></p><p style="text-align:center;"></p><p style="text-align:center;"><img class="ipsImage ipsImage_thumbnailed ipsRichText__align--block" data-fileid="15813191" src="https://www.bellazon.com/main/uploads/monthly_2026_01/1222250126covershrinstagram2.thumb.jpg.7bfbdc57ebcbfd61e4ba72c2b55dfbf3.jpg" alt="1222250126covershrinstagram2.jpg" title="" width="230" height="300" data-full-image="https://www.bellazon.com/main/uploads/monthly_2026_01/1222250126covershrinstagram2.jpg.9bca664c750694127c5c77c0e99db770.jpg" loading="lazy"><img class="ipsImage ipsImage_thumbnailed ipsRichText__align--block" data-fileid="15813196" src="https://www.bellazon.com/main/uploads/monthly_2026_01/1222250126covershrcms2.thumb.jpg.4ae359d3f0927aca1f7ab6a4d44b47cf.jpg" alt="1222250126covershrcms2.jpg" title="" width="231" height="300" data-full-image="https://www.bellazon.com/main/uploads/monthly_2026_01/1222250126covershrcms2.jpg.a4d33f2e157aec446f9e268cce576ddc.jpg" loading="lazy"><img class="ipsImage ipsImage_thumbnailed ipsRichText__align--block" data-fileid="15813194" src="https://www.bellazon.com/main/uploads/monthly_2026_01/1-0126broadsheetcmslo13-14.thumb.jpg.904162a4ebd4a340d5a595df82e7c982.jpg" alt="1-0126broadsheetcmslo13-14.jpg" title="" width="300" height="194" data-full-image="https://www.bellazon.com/main/uploads/monthly_2026_01/1-0126broadsheetcmslo13-14.jpg.21f087b58d0d3cc5c7d03ea2bb62a979.jpg" loading="lazy"></p>""",
|
||||
"count" : 4,
|
||||
"date" : "dt:2026-01-06 16:34:53",
|
||||
"id" : "6113627",
|
||||
},
|
||||
},
|
||||
|
||||
{
|
||||
"#url" : "https://www.bellazon.com/main/topic/57872-millie-brady/",
|
||||
"#class" : bellazon.BellazonThreadExtractor,
|
||||
|
||||
Reference in New Issue
Block a user