[joyreactor] try to prevent JsonDecodeErrors (#114)
This commit is contained in:
@@ -63,8 +63,15 @@ class JoyreactorExtractor(Extractor):
|
|||||||
def _parse_post(post):
|
def _parse_post(post):
|
||||||
post, _, script = post.partition('<script type="application/ld+json">')
|
post, _, script = post.partition('<script type="application/ld+json">')
|
||||||
images = text.extract_iter(post, '<div class="image">', '</div>')
|
images = text.extract_iter(post, '<div class="image">', '</div>')
|
||||||
script = script[:script.index("</")].strip().replace("\\", "\\\\")
|
script = script[:script.index("</")].strip()
|
||||||
data = json.loads(script)
|
|
||||||
|
try:
|
||||||
|
data = json.loads(script)
|
||||||
|
except ValueError:
|
||||||
|
data = json.loads(script
|
||||||
|
.replace("\\", "\\\\")
|
||||||
|
.replace("\n", "")
|
||||||
|
.replace("\r", ""))
|
||||||
|
|
||||||
num = 0
|
num = 0
|
||||||
date = data["datePublished"]
|
date = data["datePublished"]
|
||||||
|
|||||||
Reference in New Issue
Block a user