[komikcast] fix extraction
... again
This commit is contained in:
@@ -82,14 +82,14 @@ class KomikcastMangaExtractor(KomikcastBase, MangaExtractor):
|
|||||||
test = (
|
test = (
|
||||||
("https://komikcast.com/komik/090-eko-to-issho/", {
|
("https://komikcast.com/komik/090-eko-to-issho/", {
|
||||||
"url": "dc798d107697d1f2309b14ca24ca9dba30c6600f",
|
"url": "dc798d107697d1f2309b14ca24ca9dba30c6600f",
|
||||||
"keyword": "3db7e23e3c108031608fbbeb9334badecd967f95",
|
"keyword": "837a7e96867344ff59d840771c04c20dc46c0ab1",
|
||||||
}),
|
}),
|
||||||
("https://komikcast.com/tonari-no-kashiwagi-san/"),
|
("https://komikcast.com/tonari-no-kashiwagi-san/"),
|
||||||
)
|
)
|
||||||
|
|
||||||
def chapters(self, page):
|
def chapters(self, page):
|
||||||
results = []
|
results = []
|
||||||
data = self.get_metadata(page)
|
data = self.metadata(page)
|
||||||
|
|
||||||
for item in text.extract_iter(
|
for item in text.extract_iter(
|
||||||
page, '<span class="leftoff"><a href="', '</a>'):
|
page, '<span class="leftoff"><a href="', '</a>'):
|
||||||
@@ -99,16 +99,16 @@ class KomikcastMangaExtractor(KomikcastBase, MangaExtractor):
|
|||||||
return results
|
return results
|
||||||
|
|
||||||
@staticmethod
|
@staticmethod
|
||||||
def get_metadata(page):
|
def metadata(page):
|
||||||
"""Return a dict with general metadata"""
|
"""Return a dict with general metadata"""
|
||||||
manga , pos = text.extract(page, "<title>", "</title>")
|
manga , pos = text.extract(page, "<title>" , "</title>")
|
||||||
author, pos = text.extract(page, "<th>Author</th><td>", "</td>", pos)
|
genres, pos = text.extract(page, ">Genres:", "</span>", pos)
|
||||||
genres, pos = text.extract(page, "<th>Genres </th><td>", "</td>", pos)
|
author, pos = text.extract(page, ">Author:", "</span>", pos)
|
||||||
mtype , pos = text.extract(page, "<th>Type </th><td>", "</td>", pos)
|
mtype , pos = text.extract(page, ">Type:" , "</span>", pos)
|
||||||
|
|
||||||
return {
|
return {
|
||||||
"manga": text.unescape(manga.rpartition(" - ")[0]),
|
"manga": text.unescape(manga.rpartition(" - ")[0]),
|
||||||
"author": text.unescape(author),
|
"author": text.remove_html(author),
|
||||||
"genres": text.remove_html(genres).replace(" , ", ", "),
|
"genres": text.split_html(genres)[::2],
|
||||||
"type": text.remove_html(mtype),
|
"type": text.remove_html(mtype),
|
||||||
}
|
}
|
||||||
|
|||||||
Reference in New Issue
Block a user