remove '&' from URL patterns
'/?&#' -> '/?#' and '?&#' -> '?#'. According to https://www.ietf.org/rfc/rfc3986.txt, URLs are "organized hierarchically" by using "the slash ("/"), question mark ("?"), and number sign ("#") characters to delimit components"; '&' is not one of these delimiters, so it does not need to be excluded from the character classes.
This commit is contained in:
@@ -56,7 +56,7 @@ class GfycatUserExtractor(GfycatExtractor):
|
||||
"""Extractor for gfycat user profiles"""
|
||||
subcategory = "user"
|
||||
directory_fmt = ("{category}", "{userName}")
|
||||
pattern = r"(?:https?://)?gfycat\.com/@([^/?&#]+)"
|
||||
pattern = r"(?:https?://)?gfycat\.com/@([^/?#]+)"
|
||||
test = ("https://gfycat.com/@gretta", {
|
||||
"pattern": r"https://giant\.gfycat\.com/[A-Za-z]+\.mp4",
|
||||
"count": ">= 100",
|
||||
@@ -70,7 +70,7 @@ class GfycatSearchExtractor(GfycatExtractor):
|
||||
"""Extractor for gfycat search results"""
|
||||
subcategory = "search"
|
||||
directory_fmt = ("{category}", "Search", "{search}")
|
||||
pattern = r"(?:https?://)?gfycat\.com/gifs/search/([^/?&#]+)"
|
||||
pattern = r"(?:https?://)?gfycat\.com/gifs/search/([^/?#]+)"
|
||||
test = ("https://gfycat.com/gifs/search/funny+animals", {
|
||||
"pattern": r"https://\w+\.gfycat\.com/[A-Za-z]+\.mp4",
|
||||
"archive": False,
|
||||
|
||||
Reference in New Issue
Block a user