gallery-dl/scripts/supportedsites.py

#!/usr/bin/env python3
# -*- coding: utf-8 -*-

# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.

"""Generate a Markdown document listing all supported sites"""

import os
import sys
import collections

import util
from gallery_dl import extractor

try:
    from test import results
except ImportError:
    results = None


# Display names for extractor categories, keyed by category identifier.
# category_text() falls back to str.capitalize() for categories that are
# not listed here, so an entry is only needed when that fallback would
# produce the wrong name.
CATEGORY_MAP = {
    "2chan"          : "Futaba Channel",
    "35photo"        : "35PHOTO",
    "adultempire"    : "Adult Empire",
    "agnph"          : "AGNPH",
    "allgirlbooru"   : "All girl",
    "archivedmoe"    : "Archived.Moe",
    "archiveofsins"  : "Archive of Sins",
    "artstation"     : "ArtStation",
    "aryion"         : "Eka's Portal",
    "atfbooru"       : "ATFBooru",
    "azurlanewiki"   : "Azur Lane Wiki",
    "b4k"            : "arch.b4k.co",
    "baraag"         : "baraag",
    "batoto"         : "BATO.TO",
    "bbc"            : "BBC",
    "cien"           : "Ci-en",
    "comicvine"      : "Comic Vine",
    "coomerparty"    : "Coomer",
    "deltaporno"     : "DeltaPorno",
    "deviantart"     : "DeviantArt",
    "drawfriends"    : "Draw Friends",
    "dynastyscans"   : "Dynasty Reader",
    "e621"           : "e621",
    "e926"           : "e926",
    "e6ai"           : "e6AI",
    "erome"          : "EroMe",
    "e-hentai"       : "E-Hentai",
    "exhentai"       : "ExHentai",
    "fallenangels"   : "Fallen Angels Scans",
    "fanbox"         : "pixivFANBOX",
    "fashionnova"    : "Fashion Nova",
    "furaffinity"    : "Fur Affinity",
    "hatenablog"     : "HatenaBlog",
    "hbrowse"        : "HBrowse",
    "hentai2read"    : "Hentai2Read",
    "hentaicosplays" : "Hentai Cosplay",
    "hentaifoundry"  : "Hentai Foundry",
    "hentaifox"      : "HentaiFox",
    "hentaihand"     : "HentaiHand",
    "hentaihere"     : "HentaiHere",
    "hentaiimg"      : "Hentai Image",
    "hentainexus"    : "HentaiNexus",
    "hitomi"         : "Hitomi.la",
    "horne"          : "horne",
    "idolcomplex"    : "Idol Complex",
    "illusioncardsbooru": "Illusion Game Cards",
    "imagebam"       : "ImageBam",
    "imagefap"       : "ImageFap",
    "imgbb"          : "ImgBB",
    "imgbox"         : "imgbox",
    "imagechest"     : "ImageChest",
    "imgkiwi"        : "IMG.Kiwi",
    "imgth"          : "imgth",
    "imgur"          : "imgur",
    "joyreactor"     : "JoyReactor",
    "itchio"         : "itch.io",
    "jpgfish"        : "JPG Fish",
    "kabeuchi"       : "かべうち",
    "kemonoparty"    : "Kemono",
    "livedoor"       : "livedoor Blog",
    "ohpolly"        : "Oh Polly",
    "omgmiamiswimwear": "Omg Miami Swimwear",
    "mangadex"       : "MangaDex",
    "mangafox"       : "Manga Fox",
    "mangahere"      : "Manga Here",
    "mangakakalot"   : "MangaKakalot",
    "mangalife"      : "MangaLife",
    "manganelo"      : "Manganato",
    "mangapark"      : "MangaPark",
    "mangaread"      : "MangaRead",
    "mangasee"       : "MangaSee",
    "mariowiki"      : "Super Mario Wiki",
    "mastodon.social": "mastodon.social",
    "mediawiki"      : "MediaWiki",
    "micmicidol"     : "MIC MIC IDOL",
    "myhentaigallery": "My Hentai Gallery",
    "myportfolio"    : "Adobe Portfolio",
    "naverwebtoon"   : "NaverWebtoon",
    "nhentai"        : "nhentai",
    "nijie"          : "nijie",
    "nozomi"         : "Nozomi.la",
    "nsfwalbum"      : "NSFWalbum.com",
    "paheal"         : "rule #34",
    "photovogue"     : "PhotoVogue",
    "pidgiwiki"      : "PidgiWiki",
    "pixeldrain"     : "pixeldrain",
    "pornimagesxxx"  : "Porn Image",
    "pornpics"       : "PornPics.com",
    "pornreactor"    : "PornReactor",
    "readcomiconline": "Read Comic Online",
    "rbt"            : "RebeccaBlackTech",
    "redgifs"        : "RedGIFs",
    "rozenarcana"    : "Rozen Arcana",
    "rule34"         : "Rule 34",
    "rule34hentai"   : "Rule34Hentai",
    "rule34us"       : "Rule 34",
    "sankaku"        : "Sankaku Channel",
    "sankakucomplex" : "Sankaku Complex",
    "seiga"          : "Niconico Seiga",
    "senmanga"       : "Sen Manga",
    "sensescans"     : "Sense-Scans",
    "sexcom"         : "Sex.com",
    "simplyhentai"   : "Simply Hentai",
    "slickpic"       : "SlickPic",
    "slideshare"     : "SlideShare",
    "smugmug"        : "SmugMug",
    "speakerdeck"    : "Speaker Deck",
    "steamgriddb"    : "SteamGridDB",
    "subscribestar"  : "SubscribeStar",
    "tbib"           : "The Big ImageBoard",
    "tcbscans"       : "TCB Scans",
    "tco"            : "Twitter t.co",
    "tmohentai"      : "TMOHentai",
    "thatpervert"    : "ThatPervert",
    "thebarchive"    : "The /b/ Archive",
    "thecollection"  : "The /co/llection",
    "tumblrgallery"  : "TumblrGallery",
    "vanillarock"    : "もえぴりあ",
    "vidyart2"       : "/v/idyart2",
    "vidyapics"      : "Vidya Booru",
    "vk"             : "VK",
    "vsco"           : "VSCO",
    "wallpapercave"  : "Wallpaper Cave",
    "webmshare"      : "webmshare",
    "webtoons"       : "Webtoon",
    "wikiart"        : "WikiArt.org",
    "wikigg"         : "wiki.gg",
    "wikimediacommons": "Wikimedia Commons",
    "xbunkr"         : "xBunkr",
    "xhamster"       : "xHamster",
    "xvideos"        : "XVideos",
    "yandere"        : "yande.re",
}

# Display labels for extractor subcategories, as consumed by
# subcategory_text(). Two kinds of entries share this dict:
#   - string values: generic labels, keyed by subcategory name
#   - dict values: per-category overrides, keyed by category name;
#     these are consulted before the generic labels
# An empty label keeps the subcategory out of the "Capabilities" column
# (see COLUMNS). Subcategories found in neither place get capitalized and
# pluralized by subcategory_text().
SUBCATEGORY_MAP = {
    ""       : "",
    "art"    : "Art",
    "audio"  : "Audio",
    "doujin" : "Doujin",
    "home"   : "Home Feed",
    "image"  : "individual Images",
    "index"  : "Site Index",
    "info"   : "User Profile Information",
    "issue"  : "Comic Issues",
    "manga"  : "Manga",
    "media"  : "Media Files",
    "note"   : "Images from Notes",
    "popular": "Popular Images",
    "recent" : "Recent Images",
    "search" : "Search Results",
    "status" : "Images from Statuses",
    "tag"    : "Tag Searches",
    "tweets" : "",
    "user"   : "User Profiles",
    "watch"  : "Watches",
    "following"    : "Followed Users",
    "related-pin"  : "related Pins",
    "related-board": "",

    # per-category overrides
    "artstation": {
        "artwork": "Artwork Listings",
        "collections": "",
    },
    "bluesky": {
        "posts": "",
    },
    "coomerparty": {
        "discord"       : "",
        "discord-server": "",
        "posts"         : "",
    },
    "desktopography": {
        "site": "",
    },
    "deviantart": {
        "gallery-search": "Gallery Searches",
        "stash" : "Sta.sh",
        "status": "Status Updates",
        "watch-posts": "",
    },
    "fanbox": {
        "supporting": "Supported User Feed",
        "redirect"  : "Pixiv Redirects",
    },
    "fapello": {
        "path": "Videos, Trending Posts, Popular Videos, Top Models",
    },
    "furaffinity": {
        "submissions": "New Submissions",
    },
    "hatenablog": {
        "archive": "Archive",
        "entry"  : "Individual Posts",
    },
    "hentaifoundry": {
        "story": "",
    },
    "imgur": {
        "favorite-folder": "Favorites Folders",
    },
    "inkbunny": {
        "unread": "Unread Submissions",
    },
    "instagram": {
        "posts": "",
        "saved": "Saved Posts",
        "tagged": "Tagged Posts",
    },
    "kemonoparty": {
        "discord"       : "Discord Servers",
        "discord-server": "",
        "posts"         : "",
    },
    "lensdump": {
        "albums": "",
    },
    "mangadex": {
        "feed" : "Followed Feed",
    },
    "nana": {
        "search": "Favorites, Search Results",
    },
    "nijie": {
        "followed": "Followed Users",
        "nuita" : "Nuita History",
    },
    "pinterest": {
        "board": "",
        "pinit": "pin.it Links",
        "created": "Created Pins",
        "allpins": "All Pins",
    },
    "pixiv": {
        "me"  : "pixiv.me Links",
        "novel-bookmark": "Novel Bookmarks",
        "novel-series": "Novel Series",
        "novel-user": "",
        "pixivision": "pixivision",
        "sketch": "Sketch",
        "work": "individual Images",
    },
    "poringa": {
        "post": "Posts Images",
    },
    "pornhub": {
        "gifs": "",
    },
    "raddle": {
        "usersubmissions": "User Profiles",
        "post"           : "Individual Posts",
        "shorturl"       : "",
    },
    "redgifs": {
        "collections": "",
    },
    "sankaku": {
        "books": "Book Searches",
    },
    "sexcom": {
        "pins": "User Pins",
    },
    "skeb": {
        "following"      : "Followed Creators",
        "following-users": "Followed Users",
    },
    "smugmug": {
        "path": "Images from Users and Folders",
    },
    "steamgriddb": {
        "asset": "Individual Assets",
    },
    "tumblr": {
        "day": "Days",
    },
    "twitter": {
        "media": "Media Timelines",
        "tweets": "",
        "replies": "",
        "community": "",
        "list-members": "List Members",
    },
    "vk": {
        "tagged": "Tagged Photos",
    },
    "vsco": {
        "spaces": "",
    },
    "wallhaven": {
        "collections": "",
        "uploads"    : "",
    },
    "wallpapercave": {
        "image": "individual Images, Search Results",
    },
    "weasyl": {
        "journals"   : "",
        "submissions": "",
    },
    "weibo": {
        "home": "",
        "newvideo": "",
    },
    "wikiart": {
        "artists": "Artist Listings",
    },
}

# Section headings used by generate_output() for groups of sites that
# share a base category. Base categories not listed here are titled
# "<Capitalized name> Instances".
BASE_MAP = {
    "E621"        : "e621 Instances",
    "foolfuuka"   : "FoolFuuka 4chan Archives",
    "foolslide"   : "FoOlSlide Instances",
    "gelbooru_v01": "Gelbooru Beta 0.1.11",
    "gelbooru_v02": "Gelbooru Beta 0.2",
    "jschan"      : "jschan Imageboards",
    "lolisafe"    : "lolisafe and chibisafe",
    "lynxchan"    : "LynxChan Imageboards",
    "moebooru"    : "Moebooru and MyImouto",
    "szurubooru"  : "szurubooru Instances",
    "urlshortener": "URL Shorteners",
    "vichan"      : "vichan Imageboards",
}

# Site URLs for instance categories whose 'root' is empty.
# build_extractor_list() checks this table before falling back to a URL
# derived from the test results.
URL_MAP = {
    "blogspot" : "https://www.blogger.com/",
    "wikimedia": "https://www.wikimedia.org/",
}

# HTML link snippets that are reused as cell content in AUTH_MAP
_OAUTH = '<a href="https://github.com/mikf/gallery-dl#oauth">OAuth</a>'
_COOKIES = '<a href="https://github.com/mikf/gallery-dl#cookies">Cookies</a>'
_APIKEY_DB = ('<a href="https://gdl-org.github.io/docs/configuration.html'
              '#extractor-derpibooru-api-key">API Key</a>')
_APIKEY_WH = ('<a href="https://gdl-org.github.io/docs/configuration.html'
              '#extractor-wallhaven-api-key">API Key</a>')
_APIKEY_WY = ('<a href="https://gdl-org.github.io/docs/configuration.html'
              '#extractor-weasyl-api-key">API Key</a>')

# Content of the "Authentication" column, keyed by category.
# Values are inserted into the table cell as-is (plain text or HTML);
# categories not listed here get an empty cell.
AUTH_MAP = {
    "aibooru"        : "Supported",
    "aryion"         : "Supported",
    "atfbooru"       : "Supported",
    "baraag"         : _OAUTH,
    "bluesky"        : "Supported",
    "booruvar"       : "Supported",
    "coomerparty"    : "Supported",
    "danbooru"       : "Supported",
    "derpibooru"     : _APIKEY_DB,
    "deviantart"     : _OAUTH,
    "e621"           : "Supported",
    "e6ai"           : "Supported",
    "e926"           : "Supported",
    "e-hentai"       : "Supported",
    "exhentai"       : "Supported",
    "fanbox"         : _COOKIES,
    "fantia"         : _COOKIES,
    "flickr"         : _OAUTH,
    "furaffinity"    : _COOKIES,
    "furbooru"       : "API Key",
    "horne"          : "Required",
    "idolcomplex"    : "Supported",
    "imgbb"          : "Supported",
    "inkbunny"       : "Supported",
    "instagram"      : _COOKIES,
    "kemonoparty"    : "Supported",
    "mangadex"       : "Supported",
    "mangoxo"        : "Supported",
    "mastodon.social": _OAUTH,
    "newgrounds"     : "Supported",
    "nijie"          : "Required",
    "patreon"        : _COOKIES,
    "pawoo"          : _OAUTH,
    "pillowfort"     : "Supported",
    "pinterest"      : _COOKIES,
    "pixiv"          : _OAUTH,
    "ponybooru"      : "API Key",
    "reddit"         : _OAUTH,
    "sankaku"        : "Supported",
    "seiga"          : _COOKIES,
    "smugmug"        : _OAUTH,
    "subscribestar"  : "Supported",
    "tapas"          : "Supported",
    "tsumino"        : "Supported",
    "tumblr"         : _OAUTH,
    "twitter"        : "Supported",
    "vipergirls"     : "Supported",
    "wallhaven"      : _APIKEY_WH,
    "weasyl"         : _APIKEY_WY,
    "zerochan"       : "Supported",
}

# Categories that build_extractor_list() skips, which keeps them out of
# the generated document
IGNORE_LIST = (
    "directlink",
    "oauth",
    "recursive",
    "test",
    "ytdl",
    "generic",
)


def domain(cls):
    """Return the domain name associated with an extractor class

    The following sources are tried in order:
      1. the last whitespace-separated word of the docstring of the module
         that defines 'cls', if that word starts with "http"
      2. 'cls.root' followed by "/", if the attribute exists and is truthy
      3. scheme and host of 'cls.example', i.e. everything up to and
         including the first "/" at or after index 8; an example URL
         without such a "/" is returned whole with a "/" appended
    """
    # Missing modules and missing or empty docstrings are expected here,
    # so check for them explicitly instead of swallowing every exception.
    module = sys.modules.get(getattr(cls, "__module__", None))
    doc = getattr(module, "__doc__", None) if module is not None else None
    if isinstance(doc, str):
        words = doc.split()
        if words and words[-1].startswith("http"):
            return words[-1]

    root = getattr(cls, "root", None)
    if root:
        return root + "/"

    url = cls.example
    # start searching at index 8 to skip the "//" of "http://" / "https://"
    end = url.find("/", 8)
    if end < 0:
        # no path component: slicing with -1+1 would yield an empty string
        return url + "/"
    return url[:end+1]


def category_text(c):
    """Return the display name of category 'c'

    Uses the CATEGORY_MAP entry when there is a non-empty one and the
    capitalized category identifier otherwise.
    """
    label = CATEGORY_MAP.get(c)
    if label:
        return label
    return c.capitalize()


def subcategory_text(c, sc):
    """Return a human-readable representation of a subcategory

    Lookup order:
      1. the per-category override SUBCATEGORY_MAP[c][sc]
      2. the generic label SUBCATEGORY_MAP[sc]
      3. 'sc' itself, capitalized and naively pluralized
         ("gallery" -> "Galleries", "album" -> "Albums")

    An empty string is a valid result; the "Capabilities" column uses it
    to leave a subcategory out.
    """
    # Generic labels (str) and per-category tables (dict) share one dict.
    # A category whose name matches a generic key - such as the ""
    # category that build_extractor_list() creates - must not be treated
    # as an override table: 'sc in <str>' is a substring test and
    # '<str>[sc]' raises TypeError.
    overrides = SUBCATEGORY_MAP.get(c)
    if isinstance(overrides, dict) and sc in overrides:
        return overrides[sc]

    # Likewise, a subcategory named like a category must not return that
    # category's override table as its label.
    label = SUBCATEGORY_MAP.get(sc)
    if isinstance(label, str):
        return label

    sc = sc.capitalize()
    if sc.endswith("y"):
        sc = sc[:-1] + "ies"
    elif not sc.endswith("s"):
        sc += "s"
    return sc


def category_key(c):
    """Return the sort key for a (category, subcategories) item

    Items are ordered by the lowercase display name of their category.
    """
    category = c[0]
    return category_text(category).lower()


def subcategory_key(sc):
    """Return the sort key for a subcategory

    "issue" is mapped to "A", which sorts before any lowercase name;
    every other subcategory is its own key.
    """
    if sc == "issue":
        return "A"
    return sc


def build_extractor_list():
    """Collect the subcategories and domains of all extractor classes

    Returns a (categories, domains) tuple:
      categories  maps a base category name to a dict that maps category
                  names to sorted lists of subcategory names; extractors
                  with a category of their own are stored under the ""
                  base category
      domains     maps category names to site URLs
    """
    categories = collections.defaultdict(lambda: collections.defaultdict(list))
    default = categories[""]
    domains = {"": ""}

    for cls in extractor._list_classes():
        name = cls.category
        if name in IGNORE_LIST:
            continue

        if name:
            # extractor with a category of its own
            default[name].append(cls.subcategory)
            if name not in domains:
                domains[name] = domain(cls)
            continue

        # no category of its own: group by base category and instance
        group = categories[cls.basecategory]
        if not cls.instances:
            group[""].append(cls.subcategory)
            continue

        for name, root, _ in cls.instances:
            group[name].append(cls.subcategory)
            if name in domains:
                continue
            if not root:
                if name in URL_MAP:
                    root = URL_MAP[name].rstrip("/")
                elif results:
                    # use domain from first matching test
                    first = results.category(name)[0]
                    root = first["#class"].from_url(first["#url"]).root
            domains[name] = root + "/"

    # sort subcategory lists
    for group in categories.values():
        for names in group.values():
            names.sort(key=subcategory_key)

    # Sites that are handled by another category's extractors get their
    # own table row, which shares the subcategory list of that category:
    # (alias, source category, URL)
    aliases = (
        # e-hentai.org
        ("e-hentai", "exhentai",
         domains["exhentai"].replace("x", "-")),
        # coomer.party
        ("coomerparty", "kemonoparty",
         domains["kemonoparty"].replace("kemono", "coomer")),
        # hentai-cosplays sister sites (hentai-img, porn-images-xxx)
        ("hentaiimg", "hentaicosplays", "https://hentai-img.com/"),
        ("pornimagesxxx", "hentaicosplays", "https://porn-images-xxx.com/"),
        # manga4life.com
        ("mangalife", "mangasee", "https://manga4life.com/"),
        # wikifeetx.com
        ("wikifeetx", "wikifeet", "https://www.wikifeetx.com/"),
    )
    for alias, source, url in aliases:
        default[alias] = default[source]
        domains[alias] = url

    return categories, domains


# Cell content functions for the table columns. Each one is called with
# (category, subcategories, domain) and returns the cell's content.

def _site_cell(category, subcategories, url):
    return category_text(category)


def _url_cell(category, subcategories, url):
    return url


def _capabilities_cell(category, subcategories, url):
    # subcategories with an empty label are left out
    labels = (subcategory_text(category, sc) for sc in subcategories)
    return ", ".join(label for label in labels if label)


def _authentication_cell(category, subcategories, url):
    return AUTH_MAP.get(category, "")


# Table columns as (header, number, content function) tuples.
# generate_output() only reads the header and the content function; the
# number is presumably a column width from an earlier output format.
COLUMNS = (
    ("Site", 20, _site_cell),
    ("URL" , 35, _url_cell),
    ("Capabilities", 50, _capabilities_cell),
    ("Authentication", 16, _authentication_cell),
)


def generate_output(columns, categories, domains):
    """Render the table of supported sites as a Markdown document

    Arguments:
      columns     sequence of column definitions; element 0 of each is
                  the header text and element 2 a function that is called
                  as function(category, subcategories, domain) and
                  returns the content of one table cell
      categories  maps base category names to mappings from category
                  names to subcategory lists
      domains     maps category names to site URLs

    Base categories with a non-empty name and at least one category are
    preceded by a heading row that spans all columns, and their entries
    keep their given order. Entries of all other groups are sorted with
    category_key().

    Returns the complete document as a string.
    """
    thead = ["<tr>"]
    thead.extend("    <th>" + column[0] + "</th>" for column in columns)
    thead.append("</tr>")

    # heading rows have to span the whole table, however many columns
    # the caller passes
    colspan = str(len(columns))

    tbody = []
    append = tbody.append

    for name, base in categories.items():

        if name and base:
            heading = BASE_MAP.get(name) or (name.capitalize() + " Instances")
            append('\n<tr>\n    <td colspan="' + colspan + '"><strong>' +
                   heading + '</strong></td>\n</tr>')
            clist = base.items()
        else:
            clist = sorted(base.items(), key=category_key)

        for category, subcategories in clist:
            # identical for every cell of this row
            url = domains[category]
            append("<tr>")
            for column in columns:
                content = column[2](category, subcategories, url)
                append("    <td>" + content + "</td>")
            append("</tr>")

    TEMPLATE = """# Supported Sites

<!-- auto-generated by {} -->
Consider all listed sites to potentially be NSFW.

<table>
<thead valign="bottom">
{}
</thead>
<tbody valign="top">
{}
</tbody>
</table>
"""
    return TEMPLATE.format(
        # last two path components of this file, e.g. "<directory>/<file>"
        "/".join(os.path.normpath(__file__).split(os.sep)[-2:]),
        "\n".join(thead),
        "\n".join(tbody),
    )


# Build the document on execution/import and write it to the path given
# as first command-line argument, or to docs/supportedsites.md by default.
categories, domains = build_extractor_list()

if len(sys.argv) > 1:
    PATH = sys.argv[1]
else:
    PATH = util.path("docs", "supportedsites.md")

with util.lazy(PATH) as fp:
    fp.write(generate_output(COLUMNS, categories, domains))
-												update/cleanup Python dev scripts

- put common code in its own util.py file
- same Python3 shebang for all scripts
- add file docstrings
- fix format string replacement fields in man page template

											
										
										
											2019-04-16 18:16:48 +02:00
+								#!/usr/bin/env python3
 								# -*- coding: utf-8 -*-
-												only rewrite utility files if contents changed

											
										
										
											2023-01-27 18:04:13 +01:00
+								# This program is free software; you can redistribute it and/or modify
 								# it under the terms of the GNU General Public License version 2 as
 								# published by the Free Software Foundation.
-												categorize sites in supportedsites.md by basecategory

											
										
										
											2021-03-12 03:56:54 +01:00
+								"""Generate a Markdown document listing all supported sites"""
-												add a script to automatically build a list of supported sites

											
										
										
											2017-01-15 21:31:21 +01:00
-												add a 'generated by …' comment to supportedsites.rst

											
										
										
											2021-01-22 21:02:12 +01:00
+								import os
-												add a script to automatically build a list of supported sites

											
										
										
											2017-01-15 21:31:21 +01:00
+								import sys
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
+								import collections
-												add a script to automatically build a list of supported sites

											
										
										
											2017-01-15 21:31:21 +01:00
-												update/cleanup Python dev scripts

- put common code in its own util.py file
- same Python3 shebang for all scripts
- add file docstrings
- fix format string replacement fields in man page template

											
										
										
											2019-04-16 18:16:48 +02:00
+								import util
 								from gallery_dl import extractor
-												add a script to automatically build a list of supported sites

											
										
										
											2017-01-15 21:31:21 +01:00
-												update scripts/supportedsites.py

											
										
										
											2023-09-11 17:36:44 +02:00
+								try:
 								    from test import results
 								except ImportError:
 								    results = None
-												add a script to automatically build a list of supported sites

											
										
										
											2017-01-15 21:31:21 +01:00
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								CATEGORY_MAP = {
-												update supportedsites.rst

											
										
										
											2017-07-15 15:01:30 +02:00
+								    "2chan"          : "Futaba Channel",
-												[35photo] add user-, genre-, and image-extractors (#162)

											
										
										
											2019-03-18 01:11:30 +01:00
+								    "35photo"        : "35PHOTO",
-												[adultempire] add gallery extractor (closes #340)

											
										
										
											2019-07-21 22:29:57 +02:00
+								    "adultempire"    : "Adult Empire",
-												[cien] initial support (#2885, #4103, #5240)

											
										
										
											2024-07-28 19:24:00 +02:00
+								    "agnph"          : "AGNPH",
-												[gelbooru_v01] support some more boorus by default

- https://drawfriends.booru.org/
- https://vidyart.booru.org/
- https://tlb.booru.org/

											
										
										
											2021-03-13 17:48:10 +01:00
+								    "allgirlbooru"   : "All girl",
-												update supportedsites.rst

											
										
										
											2017-07-15 15:01:30 +02:00
+								    "archivedmoe"    : "Archived.Moe",
 								    "archiveofsins"  : "Archive of Sins",
-												check supportedsites.rst in release script

											
										
										
											2018-03-17 15:35:38 +01:00
+								    "artstation"     : "ArtStation",
-												[aryion] add gallery and post extractors (#390, #673)

											
										
										
											2020-04-08 21:38:02 +02:00
+								    "aryion"         : "Eka's Portal",
-												[danbooru] inherit from BaseExtractor

- merge danbooru and e621 code
- support booru.allthefallen.moe (closes #2283)
- remove support for old e621 tag search URLs

											
										
										
											2022-02-11 21:01:51 +01:00
+								    "atfbooru"       : "ATFBooru",
-												[azurlanewiki] supportedsites + test

											
										
										
											2024-02-29 21:49:13 +01:00
+								    "azurlanewiki"   : "Azur Lane Wiki",
-												[foolfuuka] add support for more sites (#18)

- https://arch.b4k.co
- https://archive.whatisthisimnotgoodwithcomputers.com
- https://archive.yeet.net

Notes:
- The name "whatisthisimnotgoodwithcomputers" is way too long ...
- archive.yeet.net is out of date and also blocked by 4chan servers
  - newest threads are 2 weeks old
  - using "https://archive.yeet.net" as Referer header results in
    "403 Forbidden" when accessing 4chan

											
										
										
											2017-09-16 21:11:44 +02:00
+								    "b4k"            : "arch.b4k.co",
-												[mastodon] add access tokens for mastodon.social and baraag.net

(closes #665)

											
										
										
											2020-04-02 22:34:32 +02:00
+								    "baraag"         : "baraag",
-												[bato] rename to 'batoto'

to use the same category name as the previous bato.to site

											
										
										
											2024-01-06 01:49:34 +01:00
+								    "batoto"         : "BATO.TO",
-												[bbc] add 'gallery' and 'programme' extractors (closes #1706)

											
										
										
											2021-07-22 20:37:05 +02:00
+								    "bbc"            : "BBC",
-												[cien] initial support (#2885, #4103, #5240)

											
										
										
											2024-07-28 19:24:00 +02:00
+								    "cien"           : "Ci-en",
-												[comicvine] add extractor (closes #1712)

											
										
										
											2021-07-23 02:01:51 +02:00
+								    "comicvine"      : "Comic Vine",
-												add 'coomer.party' to supported sites (closes #2462)

											
										
										
											2022-04-06 21:27:31 +02:00
+								    "coomerparty"    : "Coomer",
-												[chevereto] support 'img.kiwi' and 'deltaporno.com' (#4664, #1381)

											
										
										
											2023-10-16 18:14:30 +02:00
+								    "deltaporno"     : "DeltaPorno",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "deviantart"     : "DeviantArt",
-												[gelbooru_v01] support some more boorus by default

- https://drawfriends.booru.org/
- https://vidyart.booru.org/
- https://tlb.booru.org/

											
										
										
											2021-03-13 17:48:10 +01:00
+								    "drawfriends"    : "Draw Friends",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "dynastyscans"   : "Dynasty Reader",
 								    "e621"           : "e621",
-												split e621 from danbooru module (#3425)

											
										
										
											2023-02-03 19:11:54 +01:00
+								    "e926"           : "e926",
-												[E621] support 'e6ai.net' (#4320)

											
										
										
											2023-07-18 18:16:30 +02:00
+								    "e6ai"           : "e6AI",
-												[erome] add extractors for albums, users, searches (closes #409)

											
										
										
											2021-02-07 22:58:19 +01:00
+								    "erome"          : "EroMe",
-												have e-hentai and exhentai on supportedsites.rst (#365)

											
										
										
											2019-08-03 11:42:28 +02:00
+								    "e-hentai"       : "E-Hentai",
 								    "exhentai"       : "ExHentai",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "fallenangels"   : "Fallen Angels Scans",
-												update fanbox entry in supportedsites.md

											
										
										
											2021-04-25 19:44:19 +02:00
+								    "fanbox"         : "pixivFANBOX",
-												[shopify] add generic collection and product extractors (#175)

with fashionnova.com  as a default domain

											
										
										
											2019-03-05 22:33:37 +01:00
+								    "fashionnova"    : "Fashion Nova",
-												[furaffinity] add extractors (#284)

											
										
										
											2020-02-11 19:51:24 +01:00
+								    "furaffinity"    : "Fur Affinity",
-												[hatenablog] add support

											
										
										
											2024-01-08 15:29:47 +01:00
+								    "hatenablog"     : "HatenaBlog",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "hbrowse"        : "HBrowse",
 								    "hentai2read"    : "Hentai2Read",
-												[hentaicosplays] Add extractor (#1473)


											
										
										
											2021-04-18 20:28:00 +02:00
+								    "hentaicosplays" : "Hentai Cosplay",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "hentaifoundry"  : "Hentai Foundry",
-												[hentaifox] add chapter extractor (#160)

											
										
										
											2019-01-28 18:00:32 +01:00
+								    "hentaifox"      : "HentaiFox",
-												[hentaihand] add extractors (closes #605)

											
										
										
											2020-02-18 23:49:59 +01:00
+								    "hentaihand"     : "HentaiHand",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "hentaihere"     : "HentaiHere",
-												[hentaicosplays] Add extractor (#1473)


											
										
										
											2021-04-18 20:28:00 +02:00
+								    "hentaiimg"      : "Hentai Image",
-												[hentainexus] restore module (#5275)

revert 97641cd1519f0be905bf3103ca1ff9e22b5387ff

											
										
										
											2024-06-03 22:06:48 +02:00
+								    "hentainexus"    : "HentaiNexus",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "hitomi"         : "Hitomi.la",
-												[horne] add support for horne.red (#2700)

											
										
										
											2022-06-25 14:24:46 +02:00
+								    "horne"          : "horne",
-												[idolcomplex] add support for idol.sankakucomplex.com

											
										
										
											2018-01-09 17:52:12 +01:00
+								    "idolcomplex"    : "Idol Complex",
-												categorize sites in supportedsites.md by basecategory

											
										
										
											2021-03-12 03:56:54 +01:00
+								    "illusioncardsbooru": "Illusion Game Cards",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "imagebam"       : "ImageBam",
 								    "imagefap"       : "ImageFap",
-												[imgbb] add album extractor (#361)

											
										
										
											2019-07-30 23:02:21 +02:00
+								    "imgbb"          : "ImgBB",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "imgbox"         : "imgbox",
-												[imagechest] Add new extractor for ImageChest (#750)

* [imagechest] Add new extractor for ImageChest

* [imagechest] Fix flake8 compliance issues
											
										
										
											2020-05-18 19:02:56 +02:00
+								    "imagechest"     : "ImageChest",
-												[chevereto] support 'img.kiwi' and 'deltaporno.com' (#4664, #1381)

											
										
										
											2023-10-16 18:14:30 +02:00
+								    "imgkiwi"        : "IMG.Kiwi",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "imgth"          : "imgth",
 								    "imgur"          : "imgur",
-												[reactor] inherit from BaseExtractor

											
										
										
											2021-11-25 16:18:48 +01:00
+								    "joyreactor"     : "JoyReactor",
-												[itchio] add 'game' extractor (#3923)

											
										
										
											2023-04-26 18:50:09 +02:00
+								    "itchio"         : "itch.io",
-												[jpgchurch] update to 'jpgfish'

											
										
										
											2023-05-25 18:58:51 +02:00
+								    "jpgfish"        : "JPG Fish",
-												[kabeuchi] add 'user' extractor (closes #561)

											
										
										
											2020-03-13 16:45:42 +01:00
+								    "kabeuchi"       : "かべうち",
-												add 'coomer.party' to supported sites (closes #2462)

											
										
										
											2022-04-06 21:27:31 +02:00
+								    "kemonoparty"    : "Kemono",
-												[livedoor] add blog- and post-extractors (#190)

											
										
										
											2019-04-06 16:10:29 +02:00
+								    "livedoor"       : "livedoor Blog",
-												[shopify] support ohpolly.com

											
										
										
											2023-01-31 19:54:41 +01:00
+								    "ohpolly"        : "Oh Polly",
-												[shopify] support omgmiamiswimwear.com (closes #1280)

											
										
										
											2021-04-13 03:05:23 +02:00
+								    "omgmiamiswimwear": "Omg Miami Swimwear",
-												[mangadex] general improvements

- support >100 chapter entries per manga
- custom archive ID format
- detect non-existing chapters

											
										
										
											2018-03-06 14:15:15 +01:00
+								    "mangadex"       : "MangaDex",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "mangafox"       : "Manga Fox",
 								    "mangahere"      : "Manga Here",
-												[mangakakalot] Added extractors for MangaKakalot (#876)


											
										
										
											2020-07-13 21:20:09 +02:00
+								    "mangakakalot"   : "MangaKakalot",
-												[mangasee] add support for 'mangalife' (#3086)


											
										
										
											2022-10-21 16:46:36 +02:00
+								    "mangalife"      : "MangaLife",
-												[manganelo] update domain to 'manganato.com'

											
										
										
											2021-05-28 17:52:30 +02:00
+								    "manganelo"      : "Manganato",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "mangapark"      : "MangaPark",
-												[mangaread] add 'chapter' and 'manga' extractors

											
										
										
											2022-11-13 11:30:29 +01:00
+								    "mangaread"      : "MangaRead",
-												[mangasee] add 'chapter' and 'manga' extractors

											
										
										
											2021-06-26 23:38:58 +02:00
+								    "mangasee"       : "MangaSee",
-												[wikimedia] generalize (#1443)

- support mediawiki.org
- support mariowiki.com (#3660)

- combine code into a single extractor
  (use prefix as subcategory)
- handle non-wiki instances
- unescape titles

											
										
										
											2024-01-18 15:36:16 +01:00
+								    "mariowiki"      : "Super Mario Wiki",
-												[mastodon] add access tokens for mastodon.social and baraag.net

(closes #665)

											
										
										
											2020-04-02 22:34:32 +02:00
+								    "mastodon.social": "mastodon.social",
-												[wikimedia] generalize (#1443)

- support mediawiki.org
- support mariowiki.com (#3660)

- combine code into a single extractor
  (use prefix as subcategory)
- handle non-wiki instances
- unescape titles

											
										
										
											2024-01-18 15:36:16 +01:00
+								    "mediawiki"      : "MediaWiki",
-												[blogger] inherit from BaseExtractor

- support www.micmicidol.club (#4759)

											
										
										
											2023-11-21 16:52:25 +01:00
+								    "micmicidol"     : "MIC MIC IDOL",
-												[myhentaigallery] update and fix extraction (#1001)

- extract more metadata
- match "/show/" URLs
- complete test results
- fix missing images for lines starting with " <img"
- fix missing comma in supportedsites.py

											
										
										
											2020-09-17 18:06:12 +02:00
+								    "myhentaigallery": "My Hentai Gallery",
-												[myportfolio] add user and gallery extractors (#95)

											
										
										
											2018-07-19 18:56:45 +02:00
+								    "myportfolio"    : "Adobe Portfolio",
-												Support naver webtoon (#1331)

* Support naver webtoon (WIP)

* Apply patch

* Change filename format

* Fill test results

* Fill test result
											
										
										
											2021-03-03 15:21:13 +01:00
+								    "naverwebtoon"   : "NaverWebtoon",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "nhentai"        : "nhentai",
 								    "nijie"          : "nijie",
-												[nozomi] add post and tag extractors (#388)

											
										
										
											2019-10-13 22:10:32 +02:00
+								    "nozomi"         : "Nozomi.la",
-												[nsfwalbum] add album extractor (closes #287)

											
										
										
											2019-06-22 22:43:09 +02:00
+								    "nsfwalbum"      : "NSFWalbum.com",
-												[paheal] add tag- and post-extractors (closes #69)

											
										
										
											2018-01-15 16:39:05 +01:00
+								    "paheal"         : "rule #34",
-												update supportedsites.rst

											
										
										
											2021-01-22 19:41:50 +01:00
+								    "photovogue"     : "PhotoVogue",
-												[wikimedia] support 'pidgi.net' and 'bulbapedia.bulbagarden.net' (#5205, #5206)

											
										
										
											2024-02-17 17:27:22 +01:00
+								    "pidgiwiki"      : "PidgiWiki",
-												[pixeldrain] add 'file' and 'album' extractors (#4839)

											
										
										
											2023-11-22 19:01:19 +01:00
+								    "pixeldrain"     : "pixeldrain",
-												[hentaicosplays] Add extractor (#1473)


											
										
										
											2021-04-18 20:28:00 +02:00
+								    "pornimagesxxx"  : "Porn Image",
-												[pornpics] add 'gallery' extractor (#263, #3544, #3654)

											
										
										
											2023-02-17 14:53:12 +01:00
+								    "pornpics"       : "PornPics.com",
-												[reactor] inherit from BaseExtractor

											
										
										
											2021-11-25 16:18:48 +01:00
+								    "pornreactor"    : "PornReactor",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "readcomiconline": "Read Comic Online",
-												update supportedsites.rst

											
										
										
											2017-07-24 10:50:40 +02:00
+								    "rbt"            : "RebeccaBlackTech",
-												[redgifs] add image extractor (#724)

											
										
										
											2020-05-10 00:31:42 +02:00
+								    "redgifs"        : "RedGIFs",
-												[foolfuuka] update domains

- remove nyafuu
- add rozenarcana (https://archive.alice.al/)
- add tokyochronos (https://www.tokyochronos.net)

											
										
										
											2022-08-24 12:14:41 +02:00
+								    "rozenarcana"    : "Rozen Arcana",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "rule34"         : "Rule 34",
-												[rule34hentai] cleanup

- fix using 'self._posts_rule34hentai'
- fix 'file_url' for posts
- update docs/supportedsites
- add tests

											
										
										
											2023-12-22 00:01:36 +01:00
+								    "rule34hentai"   : "Rule34Hentai",
-												[rule34us] add 'tag' and 'post' extractors (#1527)

											
										
										
											2021-12-12 23:36:16 +01:00
+								    "rule34us"       : "Rule 34",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "sankaku"        : "Sankaku Channel",
-												[sankakucomplex] move article extractor to its own module (#258)

											
										
										
											2019-05-27 23:49:23 +02:00
+								    "sankakucomplex" : "Sankaku Complex",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "seiga"          : "Niconico Seiga",
 								    "senmanga"       : "Sen Manga",
 								    "sensescans"     : "Sense-Scans",
-												[sexcom] add pin and board extractors (#147)

											
										
										
											2019-04-23 22:10:39 +02:00
+								    "sexcom"         : "Sex.com",
-												[simplyhentai] add gallery extractor (#89)

											
										
										
											2018-05-27 15:25:04 +02:00
+								    "simplyhentai"   : "Simply Hentai",
-												[slickpic] add album extractor (#249)

											
										
										
											2019-06-09 21:59:22 +02:00
+								    "slickpic"       : "SlickPic",
-												[slideshare] improve metadata; flake8

- added 'views' and 'published' keywords
- fixed longer titles and descriptions

											
										
										
											2017-12-13 21:15:05 +01:00
+								    "slideshare"     : "SlideShare",
-												[smugmug] added image and album extractor

just some initial code that still requires a lot of work ...

TODO:
- folders
- old-style albums (which are nearly all of them ...)
- images from users
- OAuth

It could also happen that the API credentials used will become invalid
whenever my 14 day trial period ends (7 days remaining), but that
would just require users to supply their own.

											
										
										
											2018-04-29 21:27:25 +02:00
+								    "smugmug"        : "SmugMug",
-												[speakerdeck] Add a new extractor for speakerdeck.com (#726)


											
										
										
											2020-05-01 22:32:22 +02:00
+								    "speakerdeck"    : "Speaker Deck",
-												[docs] add steamgriddb to supportedsites.md

											
										
										
											2024-01-09 07:22:25 +01:00
+								    "steamgriddb"    : "SteamGridDB",
-												update supportedsites.py (#889, #893)

- mention optional auth access for more sites
- link to OAuth and Cookies sections in README

											
										
										
											2020-07-14 16:18:21 +02:00
+								    "subscribestar"  : "SubscribeStar",
-												categorize sites in supportedsites.md by basecategory

											
										
										
											2021-03-12 03:56:54 +01:00
+								    "tbib"           : "The Big ImageBoard",
-												[tcbscans] add 'chapter' and 'manga' extractors

											
										
										
											2023-01-06 11:33:41 +01:00
+								    "tcbscans"       : "TCB Scans",
-												[urlshortener] add support for bit.ly & t.co

											
										
										
											2023-03-28 18:06:41 +02:00
+								    "tco"            : "Twitter t.co",
-												[tmohentai] simplify + tests

											
										
										
											2023-11-21 20:24:07 +01:00
+								    "tmohentai"      : "TMOHentai",
-												[reactor] support thatpervert.com (closes #2029)

											
										
										
											2021-11-25 16:22:17 +01:00
+								    "thatpervert"    : "ThatPervert",
-												update supportedsites.rst

											
										
										
											2017-07-24 10:50:40 +02:00
+								    "thebarchive"    : "The /b/ Archive",
-												categorize sites in supportedsites.md by basecategory

											
										
										
											2021-03-12 03:56:54 +01:00
+								    "thecollection"  : "The /co/llection",
-												support `tumblrgallery.xyz` (#1298)

* support `tumblrgallery.xyz`

* fix format issues

* Refactor and add post and search page support

* Fix warnings

* Few improvements

* Better file names

* Fix linting errors

* move id closer to the beginning of the file name

Co-authored-by: topozorra <none>
											
										
										
											2021-03-03 15:20:47 +01:00
+								    "tumblrgallery"  : "TumblrGallery",
-												[vanillarock] add post and tag extractors (closes #254)

											
										
										
											2019-06-23 22:02:54 +02:00
+								    "vanillarock"    : "もえぴりあ",
-												[gelbooru_v01] 'vidyart' -> 'vidyart2'

											
										
										
											2023-07-14 15:09:39 +02:00
+								    "vidyart2"       : "/v/idyart2",
-												[shimmie2] support 'vidya.pics' (#5632)

											
										
										
											2024-06-06 15:08:56 +02:00
+								    "vidyapics"      : "Vidya Booru",
-												[vk] initial support for albums (#474)

											
										
										
											2021-03-23 18:48:01 +01:00
+								    "vk"             : "VK",
-												[vsco] add user extractor (#331)

											
										
										
											2019-07-22 22:15:36 +02:00
+								    "vsco"           : "VSCO",
-												[wallpapercave] add extractor for images (#2205)


											
										
										
											2022-02-11 23:44:51 +01:00
+								    "wallpapercave"  : "Wallpaper Cave",
-												[webmshare] add 'video' extractor (#2410)

											
										
										
											2022-12-14 19:59:07 +01:00
+								    "webmshare"      : "webmshare",
-												[webtoons] Add a new extractor for webtoons.com (#761)

The webtoons extractor can extract episode and entire comic (all
episodes) from webtoons.com.

All the logic of the extractors should be trivial except for a couple
of kludges needed:

 - `ageGatePass' cookie is always set to avoid possible redirect and stop of
    extraction, especially in the comic extractor
 - The image URLs returned by the episode extractor could not be fetched
   directly and the `Referer:' HTTP header needs to be passed to fetch them

Close #593.
											
										
										
											2020-05-18 19:04:20 +02:00
+								    "webtoons"       : "Webtoon",
-												[wikiart] add extractors (#179)

for
- artists:          https://www.wikiart.org/en/thomas-cole
- artist-listings:  https://www.wikiart.org/en/artists-by-century/12
- artwork-listings: https://www.wikiart.org/en/paintings-by-media/grisaille

											
										
										
											2019-04-02 17:34:57 +02:00
+								    "wikiart"        : "WikiArt.org",
-												[wikimedia] support wiki.gg wikis

											
										
										
											2024-04-09 19:24:01 +02:00
+								    "wikigg"         : "wiki.gg",
-												[wikimedia] update

- rewrite using BaseExtractor
- support most Wiki* domains
- update docs/supportedsites
- add tests

											
										
										
											2024-01-16 22:08:03 +01:00
+								    "wikimediacommons": "Wikimedia Commons",
-												[lolisafe] add support for xbunkr (#3156)


											
										
										
											2022-11-04 16:13:52 +01:00
+								    "xbunkr"         : "xBunkr",
-												[xhamster] add gallery & user extractor (#281)

											
										
										
											2019-06-04 22:23:32 +02:00
+								    "xhamster"       : "xHamster",
-												[xvideos] add user profile extractor (#45)

											
										
										
											2017-11-02 17:28:35 +01:00
+								    "xvideos"        : "XVideos",
-												categorize sites in supportedsites.md by basecategory

											
										
										
											2021-03-12 03:56:54 +01:00
+								    "yandere"        : "yande.re",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								}
 								SUBCATEGORY_MAP = {
-												[urlshortener] add support for bit.ly & t.co

											
										
										
											2023-03-28 18:06:41 +02:00
+								    ""       : "",
-												[toyhouse] support 'art' listings (#1546, #2331)

											
										
										
											2022-02-27 16:22:50 +01:00
+								    "art"    : "Art",
 								    "audio"  : "Audio",
-												[nijie] add favorites extractor

adds support for 'https://nijie.info/user_like_illust_view.php?id=...'

											
										
										
											2018-03-31 18:54:25 +02:00
+								    "doujin" : "Doujin",
-												[fanbox] add 'home' and 'supporting' extractors (#5138)

											
										
										
											2024-02-14 23:25:39 +01:00
+								    "home"   : "Home Feed",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "image"  : "individual Images",
-												[nozomi] support '/index-N.html' URLs (closes #1365)

and '/index-Popular-N.html'

											
										
										
											2021-03-11 01:06:47 +01:00
+								    "index"  : "Site Index",
-												[instagram][twitter] rename 'profile' to 'info' (#5262, #3623)

											
										
										
											2024-07-10 15:55:39 +02:00
+								    "info"   : "User Profile Information",
-												remove dashes from subcategory names in supportedsites.rst

											
										
										
											2020-03-24 02:00:50 +01:00
+								    "issue"  : "Comic Issues",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "manga"  : "Manga",
-												[toyhouse] support 'art' listings (#1546, #2331)

											
										
										
											2022-02-27 16:22:50 +01:00
+								    "media"  : "Media Files",
-												[misskey] add misskey extractors

											
										
										
											2023-03-01 12:30:56 +01:00
+								    "note"   : "Images from Notes",
-												[booru] add extractors for "Popular" images

											
										
										
											2017-08-24 21:24:51 +02:00
+								    "popular": "Popular Images",
-												[hentaifoundry] add 'popular' and 'recent' extractors

for "Popular Pictures" and "Recent Pictures" listings

											
										
										
											2018-09-22 21:28:16 +02:00
+								    "recent" : "Recent Images",
-												add 'Authentication' column to supportedsites.rst

											
										
										
											2017-06-15 21:06:20 +02:00
+								    "search" : "Search Results",
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								    "status" : "Images from Statuses",
-												remove dashes from subcategory names in supportedsites.rst

											
										
										
											2020-03-24 02:00:50 +01:00
+								    "tag"    : "Tag Searches",
-												[nitter] add extractors for Nitter instances (#2696)

											
										
										
											2022-11-15 11:44:16 +01:00
+								    "tweets" : "",
-												change text representation of user extractors to "User Profiles"

											
										
										
											2019-09-22 22:21:48 +02:00
+								    "user"   : "User Profiles",
-												[deviantart] add 'watch' extractor (#794)

											
										
										
											2021-03-17 22:50:02 +01:00
+								    "watch"  : "Watches",
-												update docs/supportedsites

											
										
										
											2023-08-24 15:01:26 +02:00
+								    "following"    : "Followed Users",
-												[pinterest] add extractors for related pins

Related pins can now be accessed by adding a "#related" fragment
to the end of a Pinterest URL, for example:
- https://www.pinterest.com/pin/858146903966145189/#related
- https://www.pinterest.com/g1952849/test-/#related

There are no explicit real URLs for related pins,
using an option to enable them results in "clunky" code,
and a custom "related:<URL>" scheme doesn't feel right either.

											
										
										
											2018-08-15 21:28:27 +02:00
+								    "related-pin"  : "related Pins",
 								    "related-board": "",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
 								    "artstation": {
 								        "artwork": "Artwork Listings",
-												[artstation] support collections (#146)

https://github.com/mikf/gallery-dl/issues/146#issuecomment-1972101003

											
										
										
											2024-03-01 19:34:08 +01:00
+								        "collections": "",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    },
-												[bluesky] initial support (#4438, #4708, #4722, #5047)

											
										
										
											2024-02-07 19:09:33 +01:00
+								    "bluesky": {
 								        "posts": "",
 								    },
-												add 'coomer.party' to supported sites (closes #2462)

											
										
										
											2022-04-06 21:27:31 +02:00
+								    "coomerparty": {
 								        "discord"       : "",
 								        "discord-server": "",
-												[kemonoparty] add 'posts' extractor (#5194)

											
										
										
											2024-02-13 15:41:34 +01:00
+								        "posts"         : "",
-												add 'coomer.party' to supported sites (closes #2462)

											
										
										
											2022-04-06 21:27:31 +02:00
+								    },
-												[desktopography] simplify (#1740)

											
										
										
											2021-09-17 20:09:24 +02:00
+								    "desktopography": {
 								        "site": "",
 								    },
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    "deviantart": {
-												[deviantart] add 'gallery-search' extractor (#1695)

											
										
										
											2023-02-22 17:25:31 +01:00
+								        "gallery-search": "Gallery Searches",
-												[deviantart] add extractor for status updates

extract user status updates using the '/user/statuses/' endpoint

											
										
										
											2023-01-17 14:16:25 +01:00
+								        "stash" : "Sta.sh",
 								        "status": "Status Updates",
-												[deviantart] add support for posts from watched users (#794)

											
										
										
											2021-03-22 19:20:08 +01:00
+								        "watch-posts": "",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    },
-												[fanbox] support pixiv redirects (closes #2122)

											
										
										
											2021-12-24 23:06:42 +01:00
+								    "fanbox": {
-												[fanbox] add 'home' and 'supporting' extractors (#5138)

											
										
										
											2024-02-14 23:25:39 +01:00
+								        "supporting": "Supported User Feed",
 								        "redirect"  : "Pixiv Redirects",
-												[fanbox] support pixiv redirects (closes #2122)

											
										
										
											2021-12-24 23:06:42 +01:00
+								    },
-												[fapello] add 'post', 'user' and 'path' extractors

											
										
										
											2022-12-13 17:03:09 +01:00
+								    "fapello": {
 								        "path": "Videos, Trending Posts, Popular Videos, Top Models",
 								    },
-												[furaffinity] add 'submissions' extractor (#5954)

											
										
										
											2024-08-07 16:28:40 +02:00
+								    "furaffinity": {
 								        "submissions": "New Submissions",
 								    },
-												[hatenablog] add support

											
										
										
											2024-01-08 15:29:47 +01:00
+								    "hatenablog": {
 								        "archive": "Archive",
 								        "entry"  : "Individual Posts",
 								    },
-												[hentaifoundry] add support for stories (closes #734)

											
										
										
											2020-09-27 02:22:23 +02:00
+								    "hentaifoundry": {
 								        "story": "",
 								    },
-												[imgur] add 'favorite-folder' extractor (#4016)

											
										
										
											2023-05-06 14:52:43 +02:00
+								    "imgur": {
 								        "favorite-folder": "Favorites Folders",
 								    },
-												[inkbunny] add 'unread' extractor (#4934)

											
										
										
											2023-12-15 21:20:12 +01:00
+								    "inkbunny": {
 								        "unread": "Unread Submissions",
 								    },
-												[instagram] use 'itertools.chain()'

											
										
										
											2020-03-16 22:57:30 +01:00
+								    "instagram": {
-												[instagram] add 'include' option (closes #1180)

Split the functionality of the old 'user' extractor into separate
'posts' and 'highlights' extractors, which respond to virtual URLs
('/<user>/posts' and '/<user>/highlights')

											
										
										
											2020-12-20 23:20:32 +01:00
+								        "posts": "",
-												[instagram] use 'itertools.chain()'

											
										
										
											2020-03-16 22:57:30 +01:00
+								        "saved": "Saved Posts",
-												update supportedsites.md entry for Instagram

											
										
										
											2021-04-22 22:57:06 +02:00
+								        "tagged": "Tagged Posts",
-												[instagram] use 'itertools.chain()'

											
										
										
											2020-03-16 22:57:30 +01:00
+								    },
-												[kemonoparty] add 'discord' extractor (#1827, #1940)

											
										
										
											2021-10-13 19:33:00 +02:00
+								    "kemonoparty": {
-												[kemonoparty] add 'posts' extractor (#5194)

											
										
										
											2024-02-13 15:41:34 +01:00
+								        "discord"       : "Discord Servers",
-												[kemonoparty] split 'discord' extractor (#1940)

in 'server' and 'channel'

											
										
										
											2021-10-18 04:04:58 +02:00
+								        "discord-server": "",
-												[kemonoparty] add 'posts' extractor (#5194)

											
										
										
											2024-02-13 15:41:34 +01:00
+								        "posts"         : "",
-												[kemonoparty] add 'discord' extractor (#1827, #1940)

											
										
										
											2021-10-13 19:33:00 +02:00
+								    },
-												[lensdump] update

- update docs/supportedsites.md
- add GPL2 header
- use BASE_PATTERN
- improve LensdumpImageExtractor

											
										
										
											2023-05-26 23:39:17 +02:00
+								    "lensdump": {
 								        "albums": "",
 								    },
-												[mangadex] add extractor for a user's followed feed (#1535)

											
										
										
											2021-06-08 02:45:36 +02:00
+								    "mangadex": {
 								        "feed" : "Followed Feed",
 								    },
-												[nana] add 'nana' extractors (#2967)


											
										
										
											2022-10-04 09:23:24 +02:00
+								    "nana": {
 								        "search": "Favorites, Search Results",
 								    },
-												[nijie] support /history_nuita.php listings (closes #2541)

											
										
										
											2022-05-01 17:45:38 +02:00
+								    "nijie": {
-												[nijie] add 'followed' extractor (#3048)

											
										
										
											2022-10-14 12:03:00 +02:00
+								        "followed": "Followed Users",
-												[nijie] support /history_nuita.php listings (closes #2541)

											
										
										
											2022-05-01 17:45:38 +02:00
+								        "nuita" : "Nuita History",
 								    },
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    "pinterest": {
-												[pinterest] add support for getting all boards of a user

(#1205)

											
										
										
											2020-12-29 16:57:03 +01:00
+								        "board": "",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								        "pinit": "pin.it Links",
-												[pinterest] add extractor for created pins (#2452)

											
										
										
											2022-04-01 16:59:58 +02:00
+								        "created": "Created Pins",
-												[pinterest] support 'All Pins' boards (#2855, #3484)

											
										
										
											2023-01-03 19:11:20 +01:00
+								        "allpins": "All Pins",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    },
 								    "pixiv": {
 								        "me"  : "pixiv.me Links",
-												[pixiv] add 'novel-bookmark' extractor (#4111)

											
										
										
											2023-05-28 16:30:17 +02:00
+								        "novel-bookmark": "Novel Bookmarks",
-												[pixiv] initial 'novel' support (#1241, #4044)

supported URLs are
- https://www.pixiv.net/novel/show.php?id=<ID>
- https://www.pixiv.net/novel/series/<ID>
- https://www.pixiv.net/en/users/<ID>/novels

											
										
										
											2023-05-12 16:01:19 +02:00
+								        "novel-series": "Novel Series",
 								        "novel-user": "",
-												[pixiv] add extractor for 'pixivision' articles (#1672)

											
										
										
											2021-07-07 02:22:44 +02:00
+								        "pixivision": "pixivision",
-												[pixiv] add 'sketch' extractor (#1497)

											
										
										
											2021-10-12 20:50:11 +02:00
+								        "sketch": "Sketch",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								        "work": "individual Images",
 								    },
-												[poringa] add support

											
										
										
											2023-12-21 19:50:54 +01:00
+								    "poringa": {
 								        "post": "Posts Images",
 								    },
-												[pornhub] add 'gif' support (#4463)

											
										
										
											2023-08-29 19:34:27 +02:00
+								    "pornhub": {
 								        "gifs": "",
 								    },
-												[postmill] add support

											
										
										
											2023-12-12 10:54:34 +01:00
+								    "raddle": {
 								        "usersubmissions": "User Profiles",
 								        "post"           : "Individual Posts",
 								        "shorturl"       : "",
 								    },
-												[redgifs] fix syntax for older Python versions

and update docs/supportedsites

											
										
										
											2023-02-18 13:07:40 +01:00
+								    "redgifs": {
 								        "collections": "",
 								    },
-												[sankaku] add support for book searches (closes #1204)

											
										
										
											2020-12-29 17:36:37 +01:00
+								    "sankaku": {
 								        "books": "Book Searches",
 								    },
-												[sexcom] add 'pins' extractor (closes #2265)

											
										
										
											2022-02-04 19:01:24 +01:00
+								    "sexcom": {
 								        "pins": "User Pins",
 								    },
-												[skeb] add extractor for followed users (#5290)

needs 'Authorization' header from browser session
-o headers.Authorization="Bearer ey…"

											
										
										
											2024-03-06 22:43:01 +01:00
+								    "skeb": {
 								        "following"      : "Followed Creators",
 								        "following-users": "Followed Users",
 								    },
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    "smugmug": {
 								        "path": "Images from Users and Folders",
 								    },
-												[docs] add steamgriddb to supportedsites.md

											
										
										
											2024-01-09 07:22:25 +01:00
+								    "steamgriddb": {
 								        "asset": "Individual Assets",
 								    },
-												[tumblr] add 'day' extractor (#3951)

											
										
										
											2023-04-24 22:01:47 +02:00
+								    "tumblr": {
 								        "day": "Days",
 								    },
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    "twitter": {
 								        "media": "Media Timelines",
-												[twitter] improve results for regular user URLs

- continuation of 3346f58a
- use media timeline results (or tweet timeline if retweets are enabled)
  plus search results starting from the last tweet id of the first
  timeline, similar to how Twitter Media Downloader operates
- the old behavior can be forced by appending '/tweets' to a user URL,
  like with '/media' (https://twitter.com/USER/tweets)
  although there should be no need to ever do that

											
										
										
											2022-05-23 18:23:21 +02:00
+								        "tweets": "",
-												[twitter] support '/with_replies' URLs (closes #1833)

											
										
										
											2021-09-10 20:40:43 +02:00
+								        "replies": "",
-												[twitter] support communities (#4913)

											
										
										
											2024-02-13 01:17:13 +01:00
+								        "community": "",
-												[twitter] add 'list-members' extractor (closes #1096)

											
										
										
											2020-11-13 06:47:45 +01:00
+								        "list-members": "List Members",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    },
-												[8chan] add 'thread' and 'board' extractors (#2938)

											
										
										
											2022-10-09 14:58:13 +02:00
+								    "vk": {
 								        "tagged": "Tagged Photos",
 								    },
-												[vsco] add 'spaces' extractor (#5202)

for spaces listed on a user page

											
										
										
											2024-02-17 18:19:16 +01:00
+								    "vsco": {
 								        "spaces": "",
 								    },
-												[wallhaven] add 'collections' extractor (#1351)

											
										
										
											2021-03-02 01:32:26 +01:00
+								    "wallhaven": {
 								        "collections": "",
-												[wallhaven] update 'user' extractor (#3226)

* [wallhaven] update 'user' extractor

* [wallhaven] update 'configuration.rst'

add 'extractor.wallhaven.include' entry

* [wallhaven] add 'wallhaven.include' in gallery-dl.conf
											
										
										
											2022-11-15 17:35:52 +01:00
+								        "uploads"    : "",
-												fix auto-generation of supportedsites.rst

											
										
										
											2020-01-13 22:29:42 +01:00
+								    },
-												[wallpapercave] add extractor for images (#2205)


											
										
										
											2022-02-11 23:44:51 +01:00
+								    "wallpapercave": {
 								        "image": "individual Images, Search Results",
 								    },
-												[weasyl] update and simplify

- simplify 'pattern' regexps
- parse 'posted_at' as 'date'
- use unaltered 'title' ({title!l:R /_/} to lowercase and replace spaces)

											
										
										
											2020-09-25 23:43:11 +02:00
+								    "weasyl": {
 								        "journals"   : "",
 								        "submissions": "",
 								    },
-												[weibo] support all different 'tabtype' listings (#686, #2601)

											
										
										
											2022-06-03 16:36:22 +02:00
+								    "weibo": {
 								        "home": "",
-												[weibo] support '?tabtype=video' listings (#2601)

											
										
										
											2022-06-12 17:55:23 +02:00
+								        "newvideo": "",
-												[weibo] support all different 'tabtype' listings (#686, #2601)

											
										
										
											2022-06-03 16:36:22 +02:00
+								    },
-												[wallhaven] add 'collections' extractor (#1351)

											
										
										
											2021-03-02 01:32:26 +01:00
+								    "wikiart": {
 								        "artists": "Artist Listings",
 								    },
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
+								}
-												categorize sites in supportedsites.md by basecategory

											
										
										
											2021-03-12 03:56:54 +01:00
# Heading text for groups of sites sharing a base category.
# Base categories missing here fall back to '<Name> Instances'.
BASE_MAP = {
    "E621": "e621 Instances",
    "foolfuuka": "FoolFuuka 4chan Archives",
    "foolslide": "FoOlSlide Instances",
    "gelbooru_v01": "Gelbooru Beta 0.1.11",
    "gelbooru_v02": "Gelbooru Beta 0.2",
    "jschan": "jschan Imageboards",
    "lolisafe": "lolisafe and chibisafe",
    "lynxchan": "LynxChan Imageboards",
    "moebooru": "Moebooru and MyImouto",
    "szurubooru": "szurubooru Instances",
    "urlshortener": "URL Shorteners",
    "vichan": "vichan Imageboards",
}
-												[blogger] inherit from BaseExtractor

- support www.micmicidol.club (#4759)

											
										
										
											2023-11-21 16:52:25 +01:00
# Fallback URLs for instance categories that do not define a root URL
URL_MAP = {
    "blogspot": "https://www.blogger.com/",
    "wikimedia": "https://www.wikimedia.org/",
}
-												update docs/supportedsites

- use Markdown with inline HTML instead of reStructuredText
- move file from docs/supportedsites.rst to docs/supportedsites.md
- update Makefile, README, etc

											
										
										
											2021-03-12 03:03:48 +01:00
+								_OAUTH = '<a href="https://github.com/mikf/gallery-dl#oauth">OAuth</a>'
 								_COOKIES = '<a href="https://github.com/mikf/gallery-dl#cookies">Cookies</a>'
-												[docs] update docs/configuration links (#5059, #5369, #5423)

											
										
										
											2024-04-13 02:18:44 +02:00
+								_APIKEY_DB = ('<a href="https://gdl-org.github.io/docs/configuration.html'
 								              '#extractor-derpibooru-api-key">API Key</a>')
 								_APIKEY_WH = ('<a href="https://gdl-org.github.io/docs/configuration.html'
 								              '#extractor-wallhaven-api-key">API Key</a>')
 								_APIKEY_WY = ('<a href="https://gdl-org.github.io/docs/configuration.html'
 								              '#extractor-weasyl-api-key">API Key</a>')
-												update supportedsites.py (#889, #893)

- mention optional auth access for more sites
- link to OAuth and Cookies sections in README

											
										
										
											2020-07-14 16:18:21 +02:00
-												add 'Authentication' column to supportedsites.rst

											
										
										
											2017-06-15 21:06:20 +02:00
+								AUTH_MAP = {
-												update Authentication support in docs

https://github.com/mikf/gallery-dl/pull/3075#issuecomment-1374723412

											
										
										
											2023-01-08 16:55:28 +01:00
+								    "aibooru"        : "Supported",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "aryion"         : "Supported",
-												[danbooru] inherit from BaseExtractor

- merge danbooru and e621 code
- support booru.allthefallen.moe (closes #2283)
- remove support for old e621 tag search URLs

											
										
										
											2022-02-11 21:01:51 +01:00
+								    "atfbooru"       : "Supported",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "baraag"         : _OAUTH,
-												[bluesky] initial support (#4438, #4708, #4722, #5047)

											
										
										
											2024-02-07 19:09:33 +01:00
+								    "bluesky"        : "Supported",
-												[docs] complete Authentication info in supportedsites.md

											
										
										
											2024-03-29 02:11:04 +01:00
+								    "booruvar"       : "Supported",
-												add 'coomer.party' to supported sites (closes #2462)

											
										
										
											2022-04-06 21:27:31 +02:00
+								    "coomerparty"    : "Supported",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "danbooru"       : "Supported",
-												[derpibooru] add search and gallery extractors (#862)

											
										
										
											2021-01-07 18:05:32 +01:00
+								    "derpibooru"     : _APIKEY_DB,
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "deviantart"     : _OAUTH,
 								    "e621"           : "Supported",
-												[docs] complete Authentication info in supportedsites.md

											
										
										
											2024-03-29 02:11:04 +01:00
+								    "e6ai"           : "Supported",
-												split e621 from danbooru module (#3425)

											
										
										
											2023-02-03 19:11:54 +01:00
+								    "e926"           : "Supported",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "e-hentai"       : "Supported",
 								    "exhentai"       : "Supported",
-												add extractors for fantia and fanbox (#1459)

* add extractors for fantia and fanbox

* appease linter

* make docstrings unique

* [fantia] refactor post extraction

* [fantia] capitalize

* [fantia] improve regex pattern

* code style

* capitalize

* [fanbox] use BASE_PATTERN for url regexes

* [fanbox] refactor metadata and post extraction

* [fanbox] improve url base pattern

* [fanbox] accept creator page links ending with /posts

* [fanbox] more tests

* [fantia] improved pagination

* [fanbox] misc. code logic improvements

* [fantia] finish restructuring pagination code

* [fanbox] avoid making a request for each individual post when processing a creator page

* [fanbox] support embedded videos

* [fanbox] fix errors

* [fanbox] document extractor.fanbox.videos

* [fanbox] handle "article" and "entry" post types, all embeds

* [fanbox] fix downloading of embedded fanbox posts

											
										
										
											2021-04-25 19:39:13 +02:00
+								    "fanbox"         : _COOKIES,
 								    "fantia"         : _COOKIES,
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "flickr"         : _OAUTH,
 								    "furaffinity"    : _COOKIES,
-												[docs] complete Authentication info in supportedsites.md

											
										
										
											2024-03-29 02:11:04 +01:00
+								    "furbooru"       : "API Key",
-												[horne] add support for horne.red (#2700)

											
										
										
											2022-06-25 14:24:46 +02:00
+								    "horne"          : "Required",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "idolcomplex"    : "Supported",
 								    "imgbb"          : "Supported",
 								    "inkbunny"       : "Supported",
-												[instagram] remove login support

broken feature that I cannot get to work anymore

											
										
										
											2022-11-08 21:48:31 +01:00
+								    "instagram"      : _COOKIES,
-												[kemonoparty] implement login with username & password (#1824)

											
										
										
											2021-09-09 01:02:59 +02:00
+								    "kemonoparty"    : "Supported",
-												[mangadex] implement login with username & password (#1535)

											
										
										
											2021-06-08 02:06:19 +02:00
+								    "mangadex"       : "Supported",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "mangoxo"        : "Supported",
 								    "mastodon.social": _OAUTH,
 								    "newgrounds"     : "Supported",
-												update supportedsites.py (#889, #893)

- mention optional auth access for more sites
- link to OAuth and Cookies sections in README

											
										
										
											2020-07-14 16:18:21 +02:00
+								    "nijie"          : "Required",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "patreon"        : _COOKIES,
 								    "pawoo"          : _OAUTH,
-												[pillowfort] implement login with username & password (#846)

											
										
										
											2021-05-19 02:57:36 +02:00
+								    "pillowfort"     : "Supported",
-												[pinterest] only mention cookies for authentication (#1856)

regular login is broken due to CAPTCHA

											
										
										
											2021-09-16 16:36:37 +02:00
+								    "pinterest"      : _COOKIES,
-												[pixiv] update (#1304)

- remove login with username & password
- require a refresh token
- add 'oauth:pixiv' functionality

See also:
- https://github.com/upbit/pixivpy/issues/158
- https://gist.github.com/ZipFile/c9ebedb224406f4f11845ab700124362

											
										
										
											2021-02-12 18:03:06 +01:00
+								    "pixiv"          : _OAUTH,
-												[philomena] add generalized extractors for philomena sites

(closes #1379)

											
										
										
											2021-03-14 16:31:33 +01:00
+								    "ponybooru"      : "API Key",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "reddit"         : _OAUTH,
-												[sankaku] reimplement login support (#1176, #1182)

											
										
										
											2020-12-17 16:12:59 +01:00
+								    "sankaku"        : "Supported",
-												[seiga] require authentication with 'user_session' cookie (#2372)

Login with username & password would now require entering a 2FA token.

see also https://github.com/danbooru/danbooru/commit/7b009cc893b314a0dec65792143aad97a2d6bf92

											
										
										
											2022-03-11 02:10:15 +01:00
+								    "seiga"          : _COOKIES,
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "smugmug"        : _OAUTH,
 								    "subscribestar"  : "Supported",
-												[tapas] implement login with username & password (#692)

											
										
										
											2021-03-29 23:06:47 +02:00
+								    "tapas"          : "Supported",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "tsumino"        : "Supported",
 								    "tumblr"         : _OAUTH,
 								    "twitter"        : "Supported",
-												[vipergirls] implement login support (#4166)

											
										
										
											2023-06-13 21:05:09 +02:00
+								    "vipergirls"     : "Supported",
-												rename 'Authentication' entries in supportedsites.rst

- change 'Optional' to 'Supported'
- use 'OAuth' and 'Cookies' in their own
- add link to weasyl API key option

											
										
										
											2020-10-18 22:18:27 +02:00
+								    "wallhaven"      : _APIKEY_WH,
 								    "weasyl"         : _APIKEY_WY,
-												[vipergirls] implement login support (#4166)

											
										
										
											2023-06-13 21:05:09 +02:00
+								    "zerochan"       : "Supported",
-												add 'Authentication' column to supportedsites.rst

											
										
										
											2017-06-15 21:06:20 +02:00
+								}
 								IGNORE_LIST = (
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
+								    "directlink",
-												add 'Authentication' column to supportedsites.rst

											
										
										
											2017-06-15 21:06:20 +02:00
+								    "oauth",
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
+								    "recursive",
 								    "test",
-												[ytdl] add extractor for sites supported by youtube-dl

(#1680, #878)

Can be used by prefixing any URL with 'ytdl:',
or by setting 'extractor,ytdl.enabled' to 'true'.

											
										
										
											2021-07-10 20:47:33 +02:00
+								    "ytdl",
-												add docs for 'extractor.generic.enabled'

											
										
										
											2021-12-29 22:45:07 +01:00
+								    "generic",
-												add 'Authentication' column to supportedsites.rst

											
										
										
											2017-06-15 21:06:20 +02:00
+								)
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
def domain(cls):
    """Return the domain name associated with an extractor class

    Candidates are tried in this order:
      1. the last whitespace-separated word of the docstring of the
         module defining 'cls', if that word starts with "http"
      2. 'cls.root' plus a trailing slash, if it is set and non-empty
      3. scheme and host part of 'cls.example'
    """
    try:
        url = sys.modules[cls.__module__].__doc__.split()[-1]
    except (KeyError, AttributeError, IndexError):
        # module not in sys.modules, module without docstring,
        # or a docstring containing only whitespace
        url = ""
    if url.startswith("http"):
        return url

    root = getattr(cls, "root", None)
    if root:
        return root + "/"

    url = cls.example
    # look for the first slash after the scheme separator
    # ("https://" is 8 characters long)
    end = url.find("/", 8)
    if end < 0:
        # no path component: use the whole URL instead of returning ""
        return url + "/"
    return url[:end+1]
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
def category_text(c):
    """Return the display name of category 'c'

    Uses the CATEGORY_MAP entry when there is a non-empty one
    and the capitalized category name otherwise.
    """
    text = CATEGORY_MAP.get(c)
    if text:
        return text
    return c.capitalize()
-												update build_supportedsites.py script

											
										
										
											2018-09-28 12:39:05 +02:00
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
def subcategory_text(c, sc):
    """Return a human-readable representation of a subcategory

    Lookup order:
      1. the entry for 'sc' in the SUBCATEGORY_MAP dict of category 'c'
      2. the top-level SUBCATEGORY_MAP text for 'sc'
      3. the capitalized, pluralized subcategory name

    The returned text can be an empty string when a map entry says so.
    """
    # category-specific override; ignore entries that are not dicts
    overrides = SUBCATEGORY_MAP.get(c)
    if isinstance(overrides, dict) and sc in overrides:
        return overrides[sc]

    # override shared by all categories; a nested per-category dict
    # stored under the same name is not a display text
    text = SUBCATEGORY_MAP.get(sc)
    if isinstance(text, str):
        return text

    sc = sc.capitalize()
    if sc.endswith("y") and len(sc) > 1 and sc[-2].lower() not in "aeiou":
        # consonant + 'y': "Gallery" -> "Galleries"
        sc = sc[:-1] + "ies"
    elif not sc.endswith("s"):
        # everything else, including vowel + 'y': "Day" -> "Days"
        sc += "s"
    return sc
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
def category_key(c):
    """Return the sort key for an item whose first element is a category

    The key is the lower-cased display name of that category.
    """
    name = c[0]
    return category_text(name).lower()
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
def subcategory_key(sc):
    """Return the sort key for a subcategory name

    "issue" is mapped to "A"; all other names are their own key.
    """
    if sc == "issue":
        return "A"
    return sc
-												update supportedsites.rst

											
										
										
											2017-07-15 15:01:30 +02:00
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
def build_extractor_list():
    """Collect subcategories and domains of all extractor classes

    Returns a '(categories, domains)' tuple:
      - 'categories' maps a base category name ("" for extractors with a
        category of their own) to a dict mapping category names to sorted
        lists of subcategory names
      - 'domains' maps category names to their URL
    """
    categories = collections.defaultdict(lambda: collections.defaultdict(list))
    default = categories[""]
    domains = {"": ""}

    for extr in extractor._list_classes():
        category = extr.category
        if category in IGNORE_LIST:
            continue

        if category:
            default[category].append(extr.subcategory)
            if category not in domains:
                domains[category] = domain(extr)
            continue

        # no category of its own: group by base category
        base = categories[extr.basecategory]
        if not extr.instances:
            base[""].append(extr.subcategory)
            continue

        for category, root, info in extr.instances:
            base[category].append(extr.subcategory)
            if category in domains:
                continue

            if not root:
                if category in URL_MAP:
                    root = URL_MAP[category].rstrip("/")
                elif results:
                    # use domain from first matching test
                    tests = results.category(category)
                    if tests:
                        test = tests[0]
                        root = test["#class"].from_url(test["#url"]).root

            # 'root' is still empty when none of the fallbacks applied;
            # store an empty URL instead of failing on 'None + "/"'
            domains[category] = root + "/" if root else ""

    # sort subcategory lists
    for base in categories.values():
        for subcategories in base.values():
            subcategories.sort(key=subcategory_key)

    # add e-hentai.org
    default["e-hentai"] = default["exhentai"]
    domains["e-hentai"] = domains["exhentai"].replace("x", "-")

    # add coomer.party
    default["coomerparty"] = default["kemonoparty"]
    domains["coomerparty"] = domains["kemonoparty"].replace("kemono", "coomer")

    # add hentai-cosplays sister sites (hentai-img, porn-images-xxx)
    default["hentaiimg"] = default["hentaicosplays"]
    domains["hentaiimg"] = "https://hentai-img.com/"

    default["pornimagesxxx"] = default["hentaicosplays"]
    domains["pornimagesxxx"] = "https://porn-images-xxx.com/"

    # add manga4life.com
    default["mangalife"] = default["mangasee"]
    domains["mangalife"] = "https://manga4life.com/"

    # add wikifeetx.com
    default["wikifeetx"] = default["wikifeet"]
    domains["wikifeetx"] = "https://www.wikifeetx.com/"

    return categories, domains
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
 								# define table columns
 								COLUMNS = (
 								    ("Site", 20,
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
+								     lambda c, scs, d: category_text(c)),
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
+								    ("URL" , 35,
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
+								     lambda c, scs, d: d),
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
+								    ("Capabilities", 50,
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
+								     lambda c, scs, d: ", ".join(subcategory_text(c, sc) for sc in scs
 								                                 if subcategory_text(c, sc))),
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
+								    ("Authentication", 16,
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
+								     lambda c, scs, d: AUTH_MAP.get(c, "")),
-												simplify build_supportedsites.py

											
										
										
											2019-02-20 19:25:41 +01:00
+								)
-												update build_supportedsites.py

											
										
										
											2019-01-09 14:21:19 +01:00
-												update docs/supportedsites

- use Markdown with inline HTML instead of reStructuredText
- move file from docs/supportedsites.rst to docs/supportedsites.md
- update Makefile, README, etc

											
										
										
											2021-03-12 03:03:48 +01:00
def generate_output(columns, categories, domains):
    """Build the text of the supported-sites document

    The result is a Markdown heading followed by an HTML table with one
    header row and one body row per category.

    Arguments:
        columns:    iterable of column definitions; element [0] is the
                    header text and element [2] is a callable that gets
                    (category, subcategories, domain) and returns the
                    cell text
        categories: mapping of group name to a mapping of
                    category -> subcategories
        domains:    mapping of category to the value handed to the
                    column callables as 'domain'

    Returns the complete document as a string.
    Raises KeyError if a category has no entry in 'domains'.
    """
    columns = tuple(columns)

    thead = ["<tr>"]
    thead.extend("    <th>" + column[0] + "</th>" for column in columns)
    thead.append("</tr>")

    # group header rows must span every column of the table,
    # however many columns were passed in
    colspan = str(len(columns))

    tbody = []
    append = tbody.append

    for name, base in categories.items():
        if name and base:
            # named, non-empty group: emit a header row for it
            title = BASE_MAP.get(name) or (name.capitalize() + " Instances")
            append('\n<tr>\n    <td colspan="' + colspan + '"><strong>' +
                   title + '</strong></td>\n</tr>')
            # entries of a named group keep the order of the mapping
            clist = base.items()
        else:
            clist = sorted(base.items(), key=category_key)

        for category, subcategories in clist:
            # the same for every column of this row
            domain = domains[category]
            append("<tr>")
            for column in columns:
                content = column[2](category, subcategories, domain)
                append("    <td>" + content + "</td>")
            append("</tr>")

    TEMPLATE = """# Supported Sites
<!-- auto-generated by {} -->
Consider all listed sites to potentially be NSFW.
<table>
<thead valign="bottom">
{}
</thead>
<tbody valign="top">
{}
</tbody>
</table>
"""
    # name the generating script by its last two path components
    script = "/".join(os.path.normpath(__file__).split(os.sep)[-2:])
    return TEMPLATE.format(script, "\n".join(thead), "\n".join(tbody))
-												improve supportedsites.rst and build script

											
										
										
											2017-04-20 16:56:50 +02:00
-												add a script to automatically build a list of supported sites

											
										
										
											2017-01-15 21:31:21 +01:00
-												fix supportedsites.py

											
										
										
											2021-02-20 22:31:21 +01:00
# collect the data the document is generated from
categories, domains = build_extractor_list()

# write to the path given as first command-line argument,
# or to docs/supportedsites.md when there is none
if len(sys.argv) > 1:
    PATH = sys.argv[1]
else:
    PATH = util.path("docs", "supportedsites.md")

with util.lazy(PATH) as fp:
    document = generate_output(COLUMNS, categories, domains)
    fp.write(document)