diff --git a/gallery_dl/extractor/2chan.py b/gallery_dl/extractor/2chan.py index c92969b0..38b2d5a8 100644 --- a/gallery_dl/extractor/2chan.py +++ b/gallery_dl/extractor/2chan.py @@ -20,7 +20,7 @@ class _2chanThreadExtractor(Extractor): filename_fmt = "{tim}.{extension}" archive_fmt = "{board}_{thread}_{tim}" url_fmt = "https://{server}.2chan.net/{board}/src/{tim}.{extension}" - pattern = r"(?:https?://)?([^.]+)\.2chan\.net/([^/]+)/res/(\d+)" + pattern = r"(?:https?://)?([\w-]+)\.2chan\.net/([^/]+)/res/(\d+)" test = ("http://dec.2chan.net/70/res/4752.htm", { "url": "f49aa31340e9a3429226af24e19e01f5b819ca1f", "keyword": "44599c21b248e79692b2eb2da12699bd0ed5640a", diff --git a/gallery_dl/extractor/__init__.py b/gallery_dl/extractor/__init__.py index 4f84d6ab..65c994dc 100644 --- a/gallery_dl/extractor/__init__.py +++ b/gallery_dl/extractor/__init__.py @@ -152,6 +152,7 @@ modules = [ "oauth", "test", "ytdl", + "generic", ] diff --git a/gallery_dl/extractor/blogger.py b/gallery_dl/extractor/blogger.py index 7e7c2829..9a86cc47 100644 --- a/gallery_dl/extractor/blogger.py +++ b/gallery_dl/extractor/blogger.py @@ -15,7 +15,7 @@ import re BASE_PATTERN = ( r"(?:blogger:(?:https?://)?([^/]+)|" - r"(?:https?://)?([^.]+\.blogspot\.com))") + r"(?:https?://)?([\w-]+\.blogspot\.com))") class BloggerExtractor(Extractor): diff --git a/gallery_dl/extractor/flickr.py b/gallery_dl/extractor/flickr.py index 6c5c7dfc..2bd8c6b6 100644 --- a/gallery_dl/extractor/flickr.py +++ b/gallery_dl/extractor/flickr.py @@ -56,7 +56,7 @@ class FlickrImageExtractor(FlickrExtractor): subcategory = "image" pattern = (r"(?:https?://)?(?:" r"(?:(?:www\.|m\.)?flickr\.com/photos/[^/]+/" - r"|[^.]+\.static\.?flickr\.com/(?:\d+/)+)(\d+)" + r"|[\w-]+\.static\.?flickr\.com/(?:\d+/)+)(\d+)" r"|flic\.kr/p/([A-Za-z1-9]+))") test = ( ("https://www.flickr.com/photos/departingyyz/16089302239", { diff --git a/gallery_dl/extractor/generic.py b/gallery_dl/extractor/generic.py new file mode 100644 index 00000000..bece9057 --- 
/dev/null +++ b/gallery_dl/extractor/generic.py @@ -0,0 +1,208 @@ +# -*- coding: utf-8 -*- + +"""Extractor for images in a generic web page.""" + +from .common import Extractor, Message +from .. import config, text +import re +import os.path + + +class GenericExtractor(Extractor): + """Extractor for images in a generic web page.""" + + category = "generic" + directory_fmt = ("{category}", "{pageurl}") + archive_fmt = "{imageurl}" + + # By default, the generic extractor is disabled + # and the "g(eneric):" prefix in url is required. + # If the extractor is enabled, make the prefix optional + pattern = r"(?ix)(?P<generic>g(?:eneric)?:)" + if config.get(("extractor", "generic"), "enabled"): + pattern += r"?" + + # The generic extractor pattern should match (almost) any valid url + # Based on: https://tools.ietf.org/html/rfc3986#appendix-B + pattern += r""" + (?P<scheme>https?://)? # optional http(s) scheme + (?P<domain>[-\w\.]+) # required domain + (?P<path>/[^?&#]*)? # optional path + (?:\?(?P<query>[^/?#]*))? # optional query + (?:\#(?P<fragment>.*))?$ # optional fragment + """ + + def __init__(self, match): + """Init.""" + Extractor.__init__(self, match) + + # Strip the "g(eneric):" prefix + # and inform about "forced" or "fallback" mode + if match.group('generic'): + self.log.info("Forcing use of generic information extractor.") + self.url = match.group(0).partition(":")[2] + else: + self.log.info("Falling back on generic information extractor.") + self.url = match.group(0) + + # Make sure we have a scheme, or use https + if match.group('scheme'): + self.scheme = match.group('scheme') + else: + self.scheme = 'https://' + self.url = self.scheme + self.url + + # Used to resolve relative image urls + self.root = self.scheme + match.group('domain') + + def items(self): + """Get page, extract metadata & images, yield them in suitable messages. 
+ + Adapted from common.GalleryExtractor.items() + + """ + page = self.request(self.url).text + data = self.metadata(page) + imgs = self.images(page) + + try: + data["count"] = len(imgs) + except TypeError: + pass + images = enumerate(imgs, 1) + + yield Message.Version, 1 + yield Message.Directory, data + + for data["num"], (url, imgdata) in images: + if imgdata: + data.update(imgdata) + if "extension" not in imgdata: + text.nameext_from_url(url, data) + else: + text.nameext_from_url(url, data) + yield Message.Url, url, data + + def metadata(self, page): + """Extract generic webpage metadata, return them in a dict.""" + data = {} + data['pageurl'] = self.url + data['title'] = text.extract(page, '<title>', "</title>")[0] or "" + data['description'] = text.extract( + page, ',