[sankaku] match URLs with 'www' subdomain (#5907)

This commit is contained in:
Mike Fährmann
2024-07-30 17:05:22 +02:00
parent 279854cd9e
commit 84eefeebd6
2 changed files with 13 additions and 1 deletions

View File

@@ -16,7 +16,7 @@ import collections
import re
BASE_PATTERN = r"(?:https?://)?" \
-r"(?:(?:chan|beta|black|white)\.sankakucomplex\.com|sankaku\.app)" \
+r"(?:(?:chan|www|beta|black|white)\.sankakucomplex\.com|sankaku\.app)" \
r"(?:/[a-z]{2})?"

View File

@@ -17,6 +17,12 @@ __tests__ = (
"#count" : 5,
},
{
"#url" : "https://www.sankakucomplex.com/?tags=bonocho",
"#category": ("booru", "sankaku", "tag"),
"#class" : sankaku.SankakuTagExtractor,
},
{
"#url" : "https://beta.sankakucomplex.com/?tags=bonocho",
"#category": ("booru", "sankaku", "tag"),
@@ -99,6 +105,12 @@ __tests__ = (
"#count" : 5,
},
{
"#url" : "https://www.sankakucomplex.com/books/90",
"#category": ("booru", "sankaku", "pool"),
"#class" : sankaku.SankakuPoolExtractor,
},
{
"#url" : "https://beta.sankakucomplex.com/books/90",
"#category": ("booru", "sankaku", "pool"),