1
0
mirror of https://github.com/mikf/gallery-dl.git synced 2024-11-23 19:22:32 +01:00
gallery-dl/gallery_dl/extractor
2023-05-28 16:30:17 +02:00
..
__init__.py [lensdump] add lensdump.com extractor 2023-05-26 03:22:23 -04:00
2chan.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
2chen.py [2chen] update domain to sturdychan.help 2023-04-19 13:54:44 +02:00
3dbooru.py
4chan.py
4chanarchives.py [4chanarchives] add end condition for 'board' extractor (#4012) 2023-05-06 20:52:45 +02:00
8chan.py update extractor test results 2022-12-08 18:58:29 +01:00
8muses.py merge #3329: [8muses] Add 'parts' to album data 2023-05-25 16:31:29 +02:00
35photo.py update extractor test results 2022-12-08 18:58:29 +01:00
500px.py replace json.dumps with direct calls to JSONEncoder.encode 2023-02-09 15:51:40 +01:00
adultempire.py
architizer.py
artstation.py [artstation] add 'max-posts' option (#3270) 2022-11-23 22:00:18 +01:00
aryion.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
bbc.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
bcy.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
behance.py [behance] 'items()' -> 'values()' 2023-04-30 13:53:51 +02:00
blogger.py [blogger] update sub regex 2023-04-03 12:43:58 +05:30
booru.py [booru] add 'url' option 2023-01-13 16:32:32 +01:00
bunkr.py [bunkr] update domain to 'bunkr.la' 2023-03-28 20:10:36 +02:00
catbox.py [catbox] add 'file' extractor (#3570) 2023-02-15 19:50:26 +01:00
comicvine.py
common.py allow for GalleryExtractors to skip loading gallery_url 2023-05-22 22:29:30 +02:00
cyberdrop.py [cyberdrop] add fallback URLs (#2668) 2022-06-13 14:19:40 +02:00
danbooru.py [danbooru] refactor pagination logic (#4002) 2023-05-14 18:39:59 +02:00
desktopography.py [desktopography] simplify (#1740) 2021-09-17 20:09:24 +02:00
deviantart.py [deviantart] revert e9353c63; retry downloads with private token 2023-04-23 21:10:16 +02:00
directlink.py [generic] revert pattern change 2023-03-09 22:25:23 +01:00
dynastyscans.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
e621.py [danbooru] refactor pagination logic (#4002) 2023-05-14 18:39:59 +02:00
erome.py replace remaining time.sleep() calls 2023-02-23 00:35:37 +01:00
exhentai.py [exhentai] remove and update sad panda check 2023-05-03 17:39:49 +02:00
fallenangels.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
fanbox.py [fanbox] skip 404ed or otherwise invalid posts (#4088) 2023-05-22 18:49:06 +02:00
fanleaks.py [fanleaks] update 'model' URL pattern 2022-12-30 19:29:55 +05:30
fantia.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
fapachi.py [fapachi] add 'post' and 'user' extractors (#3347) 2022-12-02 13:54:29 +01:00
fapello.py [fapello] set 'filename_fmt' 2022-12-16 20:57:39 +05:30
flickr.py [flickr] add support for secure.flickr.com (#2910) 2022-09-14 16:19:27 +02:00
foolfuuka.py [foolfuuka] add 'archive.palanq.win' 2023-05-02 19:58:55 +02:00
foolslide.py [foolslide] remove 'sensescans.com' 2023-05-02 20:09:04 +02:00
furaffinity.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
fuskator.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
gelbooru_v01.py [gelbooru_v01] remove 'tlb.booru.org' from supported domains 2022-05-10 12:23:05 +02:00
gelbooru_v02.py [realbooru] fix extraction 2023-04-02 20:45:16 +02:00
gelbooru.py [gelbooru] fix --range for favorites (#3704) 2023-03-23 22:58:13 +01:00
generic.py [generic] write regular expressions without 'x' flags 2023-04-10 20:45:23 +02:00
gfycat.py [gfycat] cleanup 2022-05-29 15:24:23 +02:00
gofile.py [gofile] automatically fetch 'website-token' by default 2023-05-20 17:00:27 +02:00
hbrowse.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentai2read.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentaicosplays.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
hentaifoundry.py [hentaifoundry] do not update filters when cookies are provided 2023-04-13 14:16:53 +02:00
hentaifox.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentaihand.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentaihere.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hiperdex.py [hiperdex] fix extraction 2023-03-25 18:18:27 +01:00
hitomi.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hotleak.py Fix indentation 2023-04-03 13:44:14 +00:00
idolcomplex.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
imagebam.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
imagechest.py [imagechest] update 2023-05-22 22:42:16 +02:00
imagefap.py [imagefap] extract 'categories' metadata and fix empty 'tags' 2023-04-17 14:49:50 +02:00
imagehosts.py [imxto] fix 'gallery' extraction 2023-04-30 15:23:13 +02:00
imgbb.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
imgbox.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
imgth.py [imgth] rewrite 2022-12-07 21:19:06 +01:00
imgur.py [imgur] fix internal image/album URLs 2023-05-06 15:13:38 +02:00
inkbunny.py [inkbunny] provide additional metadata (#3274) 2022-11-22 18:54:22 +01:00
instagram.py [instagram] add 'metadata' option (#3107) 2023-05-27 15:51:13 +02:00
issuu.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
itaku.py [itaku] remove 'Extreme' rating (#3287) 2022-11-24 11:09:00 +01:00
itchio.py [itchio] add 'game' extractor (#3923) 2023-04-26 19:20:43 +02:00
jpgfish.py [jpgfish] simplify and improve 2023-05-25 22:58:42 +02:00
kabeuchi.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
keenspot.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
kemonoparty.py [kemonoparty] fix kemono and coomer logins using the same cache 2023-05-26 13:35:02 +02:00
khinsider.py [khinsider] fix metadata extraction 2022-12-07 21:36:34 +01:00
komikcast.py [komikcast] update domain and fix extraction 2022-12-06 22:00:23 +01:00
lensdump.py [lensdump] update 2023-05-26 23:39:17 +02:00
lexica.py [lexica] add 'search' extractor (#3567) 2023-01-28 16:00:32 +01:00
lightroom.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
lineblog.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
livedoor.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
lolisafe.py [bunkr] update domain (#3391) 2022-12-11 23:18:01 +01:00
luscious.py update extractor test results 2022-08-28 00:16:12 +02:00
lynxchan.py [lynxchan/bbw-chan] add 'thread' and 'board' extractors 2022-12-26 20:59:42 +05:30
mangadex.py [mangadex] update links to API docs 2023-05-24 12:32:13 +02:00
mangafox.py [mangafox] extract more metadata (#3167) 2022-12-14 19:56:59 +01:00
mangahere.py update extractor test results 2022-07-12 15:49:22 +02:00
mangakakalot.py update extractor test results 2022-07-12 15:49:22 +02:00
manganelo.py [manganelo] match more minor version separators (#3972) 2023-04-27 13:12:11 +02:00
mangapark.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
mangaread.py [mangaread] fix 'tags' extraction 2023-05-25 17:04:20 +02:00
mangasee.py [mangasee] extract 'author' and 'genre' metadata (#3703) 2023-02-26 14:12:19 +01:00
mangoxo.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
mastodon.py [mastodon] try to get account IDs without access token 2023-04-13 14:03:23 +02:00
mememuseum.py [mememuseum] add 'tag' and 'post' extractors (closes #2264) 2022-02-20 02:15:38 +01:00
message.py
misskey.py [misskey] update 2023-05-23 22:17:17 +02:00
moebooru.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
myhentaigallery.py [myhentaigallery] handle whitespace before the title tag 2023-01-06 16:33:04 +01:00
myportfolio.py remove '&' from URL patterns part 2 2023-05-03 20:26:25 +02:00
naver.py
naverwebtoon.py [naverwebtoon] fix extraction (#3729) 2023-03-19 17:08:58 +01:00
newgrounds.py [newgrounds] add default delay between requests (#4046) 2023-05-11 16:04:37 +02:00
nhentai.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
nijie.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
nitter.py [nitter] extract user IDs from encoded banner URLs 2023-04-23 19:13:27 +02:00
nozomi.py [nozomi] update file URLs (#3925) 2023-04-17 15:42:42 +02:00
nsfwalbum.py [nsfwalbum] detect placeholder images 2023-05-17 15:18:10 +02:00
nudecollect.py [nudecollect] add 'image' and 'album' extractors 2023-01-26 17:25:33 +05:30
oauth.py remove '*' indicating keyword-only arguments 2023-05-02 22:23:33 +02:00
paheal.py [shimmie2] add generic extractors for Shimmie2 sites (#3734) 2023-04-26 19:20:44 +02:00
patreon.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
philomena.py [philomena] match URLs with www subdomain 2023-01-24 22:43:24 +01:00
photobucket.py replace remaining instances of base64 with binascii 2023-03-02 18:25:47 +01:00
photovogue.py [photovogue] switch to .com, update api endpoint (#2494) 2022-04-27 22:37:53 +02:00
picarto.py [picarto] add 'gallery' extractor (closes #1931) 2021-10-13 01:22:10 +02:00
piczel.py update extractor test results 2022-07-12 15:49:22 +02:00
pillowfort.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
pinterest.py remove '&' from URL patterns part 2 2023-05-03 20:26:25 +02:00
pixiv.py [pixiv] add 'novel-bookmark' extractor (#4111) 2023-05-28 16:30:17 +02:00
pixnet.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
plurk.py replace remaining time.sleep() calls 2023-02-23 00:35:37 +01:00
poipiku.py [poipiku] extract full 'descriptions' (#4066) 2023-05-15 23:16:31 +02:00
pornhub.py generic extractor (#735) 2021-12-29 22:39:29 +01:00
pornpics.py [pornpics] support '/pornstar' and '/channels' listings 2023-02-18 22:38:21 +01:00
pururin.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
reactor.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
readcomiconline.py update extractor test results 2022-07-12 15:49:22 +02:00
recursive.py
reddit.py [reddit] simplify and add tests 2023-05-25 13:15:11 +02:00
redgifs.py [redgifs] fix syntax for older Python versions 2023-02-18 13:07:40 +01:00
rule34us.py [rule34us] extract tags per category (#1527) 2021-12-16 00:06:52 +01:00
sankaku.py [sankaku] support post URLs with MD5 hashes (#3952) 2023-04-23 16:46:40 +02:00
sankakucomplex.py remove '&' from URL patterns part 2 2023-05-03 20:26:25 +02:00
seiga.py [seiga] raise error when redirected to login page (#3401) 2022-12-17 12:52:17 +01:00
senmanga.py
sexcom.py [sexcom] fix fetching HD videos 2023-04-13 15:40:53 +02:00
shimmie2.py [shimmie2] add generic extractors for Shimmie2 sites (#3734) 2023-04-26 19:20:44 +02:00
shopify.py [shopify] fix 'collection' extractor 2023-04-03 12:19:09 +05:30
simplyhentai.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
skeb.py [skeb] fix extraction (#3112) 2022-10-29 15:07:21 +02:00
slickpic.py update extractor test results 2022-12-08 18:58:29 +01:00
slideshare.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
smugmug.py update extractor test results 2022-12-08 18:58:29 +01:00
soundgasm.py [soundgasm] rewrite (#3578) 2023-02-15 16:52:07 +01:00
speakerdeck.py
subscribestar.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
szurubooru.py [szurubooru] add 'tag' and 'post' extractors (#3583, #3713) 2023-03-01 18:47:10 +01:00
tapas.py update extractor test results 2022-08-28 00:16:12 +02:00
tcbscans.py [tcbscans] update domain to 'tcbscans.com' (#4080) 2023-05-20 13:59:35 +02:00
telegraph.py [telegraph] fix extraction when images not in <figure> (#3590) 2023-01-31 22:14:44 +01:00
test.py
toyhouse.py [toyhouse] support 'art' listings (#1546, #2331) 2022-02-27 16:22:50 +01:00
tsumino.py
tumblr.py [tumblr] add 'day' extractor (#3951) 2023-04-24 22:01:47 +02:00
tumblrgallery.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
twibooru.py update extractor test results 2022-12-08 18:58:29 +01:00
twitter.py [twitter] optimize '_extract_twitpic()' 2023-05-25 15:18:49 +02:00
unsplash.py update extractor test results 2022-12-08 18:58:29 +01:00
uploadir.py [uploadir] use utf-8 filenames (#3162) 2022-11-05 19:03:48 +01:00
urlshortener.py remove '&' from URL patterns part 2 2023-05-03 20:26:25 +02:00
vanillarock.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
vichan.py [vichan] recognize board url w/o trailing slash (#3087) 2022-10-24 15:52:54 +02:00
vipergirls.py [vipergirls] add 'thread' and 'post' extractors 2023-04-19 15:28:26 +02:00
vk.py fix 'keywords' in extractor tests (#3491) 2023-01-03 15:14:23 +01:00
vsco.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
wallhaven.py [wallhaven] update 'user' extractor (#3226) 2022-11-15 17:35:52 +01:00
wallpapercave.py [wallpapercave] add extractor for images (#2205) 2022-02-11 23:44:51 +01:00
warosu.py [warosu] fix and update 2022-12-07 21:23:45 +01:00
weasyl.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
webmshare.py [webmshare] add 'video' extractor (#2410) 2022-12-14 19:59:07 +01:00
webtoons.py update extractor test results 2022-12-08 18:58:29 +01:00
weibo.py [weibo] require numeric IDs to have length >= 10 (#4059) 2023-05-14 18:45:37 +02:00
wikiart.py update extractor test results 2022-04-18 17:24:00 +02:00
wikifeet.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
xhamster.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
xvideos.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
ytdl.py refactor proxy handling code (#2357) 2022-03-10 23:55:35 +01:00
zerochan.py fix 'keywords' in extractor tests (#3491) 2023-01-03 15:14:23 +01:00