[webtoons] small optimization
Don't extract the entire 'author_area' block, and avoid creating a second 'text.extract_from()' object.
This commit is contained in:
@@ -92,10 +92,11 @@ class WebtoonsEpisodeExtractor(WebtoonsBase, GalleryExtractor):
|
|||||||
title = extr('<meta property="og:title" content="', '"')
|
title = extr('<meta property="og:title" content="', '"')
|
||||||
descr = extr('<meta property="og:description" content="', '"')
|
descr = extr('<meta property="og:description" content="', '"')
|
||||||
|
|
||||||
author_area = extr('<div class="author_area">', '</div>')
|
if extr('<div class="author_area"', '\n'):
|
||||||
aa_extr = text.extract_from(author_area)
|
username = extr('/creator/', '"')
|
||||||
username = aa_extr('/creator/', '"')
|
author_name = extr('<span>', '</span>')
|
||||||
author_name = aa_extr('<span>', '</span>')
|
else:
|
||||||
|
username = author_name = ""
|
||||||
|
|
||||||
return {
|
return {
|
||||||
"genre" : self.genre,
|
"genre" : self.genre,
|
||||||
|
|||||||
@@ -20,6 +20,22 @@ __tests__ = (
|
|||||||
"42055e44659f6ffc410b3fb6557346dfbb993df3",
|
"42055e44659f6ffc410b3fb6557346dfbb993df3",
|
||||||
"49e1f2def04c6f7a6a3dacf245a1cd9abe77a6a9",
|
"49e1f2def04c6f7a6a3dacf245a1cd9abe77a6a9",
|
||||||
],
|
],
|
||||||
|
|
||||||
|
"author_name" : "Chris McCoy",
|
||||||
|
"comic" : "safely-endangered",
|
||||||
|
"comic_name" : "Safely Endangered",
|
||||||
|
"count" : 5,
|
||||||
|
"description" : "Silly comics for silly people.",
|
||||||
|
"episode" : "572",
|
||||||
|
"episode_name": "Ep. 572 - Earth",
|
||||||
|
"episode_no" : "572",
|
||||||
|
"genre" : "comedy",
|
||||||
|
"lang" : "en",
|
||||||
|
"language" : "English",
|
||||||
|
"num" : range(1, 5),
|
||||||
|
"title" : "Safely Endangered - Ep. 572 - Earth",
|
||||||
|
"title_no" : "352",
|
||||||
|
"username" : "safelyendangered",
|
||||||
},
|
},
|
||||||
|
|
||||||
{
|
{
|
||||||
|
|||||||
Reference in New Issue
Block a user