1
0
mirror of https://github.com/mikf/gallery-dl.git synced 2024-11-23 19:22:32 +01:00
gallery-dl/gallery_dl/extractor
Mike Fährmann 8e1e8a5bea
[soundgasm] rewrite (#3578)
use a more standard extractor structure to make -A work as expected
2023-02-15 16:52:07 +01:00
..
__init__.py split e621 from danbooru module (#3425) 2023-02-03 19:24:31 +01:00
2chan.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
2chen.py [2chen] fix file URLs 2022-12-15 18:05:32 +01:00
3dbooru.py [moebooru] add generalized extractors for moebooru sites 2020-12-01 22:27:18 +01:00
4chan.py remove most 'yield Message.Version' statements 2021-08-16 03:10:48 +02:00
8chan.py update extractor test results 2022-12-08 18:58:29 +01:00
8muses.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
35photo.py update extractor test results 2022-12-08 18:58:29 +01:00
420chan.py [420chan] add 'thread' and 'board' extractors (closes #1773) 2021-08-21 22:46:22 +02:00
500px.py replace json.dumps with direct calls to JSONEncoder.encode 2023-02-09 15:51:40 +01:00
adultempire.py update extractor class hierarchies 2019-10-16 18:15:29 +02:00
architizer.py update extractor test results 2021-07-20 20:21:33 +02:00
artstation.py [artstation] add 'max-posts' option (#3270) 2022-11-23 22:00:18 +01:00
aryion.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
bbc.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
bcy.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
behance.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
blogger.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
booru.py [booru] add 'url' option 2023-01-13 16:32:32 +01:00
bunkr.py [bunkr] fix extraction (#3636, #3655) 2023-02-15 15:42:32 +01:00
catbox.py [catbox] add 'album' extractor (#2410) 2022-08-18 18:00:24 +02:00
comicvine.py [comicvine] add extractor (closes #1712) 2021-07-23 16:17:06 +02:00
common.py [instagram] show -o cursor=… after every error (#3440) 2023-01-23 13:00:44 +01:00
cyberdrop.py [cyberdrop] add fallback URLs (#2668) 2022-06-13 14:19:40 +02:00
danbooru.py [e621] implement 'notes' and 'pools' metadata extraction 2023-02-04 21:20:38 +01:00
desktopography.py [desktopography] simplify (#1740) 2021-09-17 20:09:24 +02:00
deviantart.py merge #3560: [deviantart] add support for /deviation/ and fav.me URLs 2023-01-23 14:16:18 +01:00
directlink.py allow '/' and '?' in URL queries 2022-10-02 19:02:05 +02:00
dynastyscans.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
e621.py [e621] implement 'notes' and 'pools' metadata extraction 2023-02-04 21:20:38 +01:00
erome.py update extractor test results 2022-12-08 18:58:29 +01:00
exhentai.py update extractor test results 2022-12-08 18:58:29 +01:00
fallenangels.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
fanbox.py [fanbox] return 'imageMap' files in order (#2718) 2023-01-01 15:12:05 +01:00
fanleaks.py [fanleaks] update 'model' URL pattern 2022-12-30 19:29:55 +05:30
fantia.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
fapachi.py [fapachi] add 'post' and 'user' extractors (#3347) 2022-12-02 13:54:29 +01:00
fapello.py [fapello] set 'filename_fmt' 2022-12-16 20:57:39 +05:30
flickr.py [flickr] add support for secure.flickr.com (#2910) 2022-09-14 16:19:27 +02:00
foolfuuka.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
foolslide.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
furaffinity.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
fuskator.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
gelbooru_v01.py [gelbooru_v01] remove 'tlb.booru.org' from supported domains 2022-05-10 12:23:05 +02:00
gelbooru_v02.py update extractor test results 2022-12-08 18:58:29 +01:00
gelbooru.py fix 'keywords' in extractor tests (#3491) 2023-01-03 15:14:23 +01:00
generic.py [generic] fix regex for non-src image URLs 2023-01-21 22:32:42 +01:00
gfycat.py [gfycat] cleanup 2022-05-29 15:24:23 +02:00
gofile.py [gofile] fix 401 Unauthorized errors (#2632) 2022-06-01 13:02:34 +02:00
hbrowse.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentai2read.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentaicosplays.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
hentaifoundry.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
hentaifox.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentaihand.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hentaihere.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hiperdex.py [hiperdex] update domain (#3572) 2023-01-26 12:01:16 +01:00
hitomi.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
hotleak.py [hotleak] optimize decoding video URLs 2023-01-28 15:41:53 +01:00
idolcomplex.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
imagebam.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
imagechest.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
imagefap.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
imagehosts.py [imagetwist] simplify pattern and add tests 2023-02-06 14:51:57 +01:00
imgbb.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
imgbox.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
imgth.py [imgth] rewrite 2022-12-07 21:19:06 +01:00
imgur.py [imgur] add support for imgur.io URLs 2022-12-17 14:33:44 +08:00
inkbunny.py [inkbunny] provide additional metadata (#3274) 2022-11-22 18:54:22 +01:00
instagram.py [instagram] add 'user' metadata field (#3107) 2023-02-06 14:43:35 +01:00
issuu.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
itaku.py [itaku] remove 'Extreme' rating (#3287) 2022-11-24 11:09:00 +01:00
kabeuchi.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
keenspot.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
kemonoparty.py [kemonoparty] remove MD5 hash extraction (#3531) 2023-01-25 11:10:09 +01:00
khinsider.py [khinsider] fix metadata extraction 2022-12-07 21:36:34 +01:00
komikcast.py [komikcast] update domain and fix extraction 2022-12-06 22:00:23 +01:00
lexica.py [lexica] add 'search' extractor (#3567) 2023-01-28 16:00:32 +01:00
lightroom.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
lineblog.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
livedoor.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
lolisafe.py [bunkr] update domain (#3391) 2022-12-11 23:18:01 +01:00
luscious.py update extractor test results 2022-08-28 00:16:12 +02:00
lynxchan.py [lynxchan/bbw-chan] add 'thread' and 'board' extractors 2022-12-26 20:59:42 +05:30
mangadex.py update extractor test results 2022-12-08 18:58:29 +01:00
mangafox.py [mangafox] extract more metadata (#3167) 2022-12-14 19:56:59 +01:00
mangahere.py update extractor test results 2022-07-12 15:49:22 +02:00
mangakakalot.py update extractor test results 2022-07-12 15:49:22 +02:00
manganelo.py [manganelo] support mobile-only chapters 2023-02-15 00:02:28 +01:00
mangapark.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
mangasee.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
mangoxo.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
mastodon.py [mastodon] add 'num' and 'count' metadata fields (#3517) 2023-01-23 13:10:11 +01:00
mememuseum.py [mememuseum] add 'tag' and 'post' extractors (closes #2264) 2022-02-20 02:15:38 +01:00
message.py remove 'Message.Metadata' (#866) 2021-01-31 02:12:37 +01:00
moebooru.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
myhentaigallery.py [myhentaigallery] handle whitespace before the title tag 2023-01-06 16:33:04 +01:00
myportfolio.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
nana.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
naver.py remove most 'yield Message.Version' statements 2021-08-16 03:10:48 +02:00
naverwebtoon.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
newgrounds.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
nhentai.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
nijie.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
nitter.py fix 'keywords' in extractor tests (#3491) 2023-01-03 15:14:23 +01:00
nozomi.py [nozomi] fix extraction (#3051) 2022-10-14 00:19:37 +02:00
nsfwalbum.py [nsfwalbum] retry all requests when extracting image URLs 2021-07-30 00:23:04 +02:00
nudecollect.py [nudecollect] add 'image' and 'album' extractors 2023-01-26 17:25:33 +05:30
oauth.py [oauth] remove stray 'exit()' (#3628) 2023-02-13 15:58:34 +01:00
paheal.py [paheal] add proper support for videos (#2892) 2022-09-04 13:30:48 +02:00
patreon.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
philomena.py [philomena] match URLs with www subdomain 2023-01-24 22:43:24 +01:00
photobucket.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
photovogue.py [photovogue] switch to .com, update api endpoint (#2494) 2022-04-27 22:37:53 +02:00
picarto.py [picarto] add 'gallery' extractor (closes #1931) 2021-10-13 01:22:10 +02:00
piczel.py update extractor test results 2022-07-12 15:49:22 +02:00
pillowfort.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
pinterest.py [pinterest] unescape search terms (#3621) 2023-02-15 15:44:20 +01:00
pixiv.py [pixiv] implement 'metadata-bookmark' option (#3417) 2023-01-07 23:19:43 +01:00
pixnet.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
plurk.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
poipiku.py [poipiku] warn about incorrect passwords (#3646) 2023-02-11 15:10:49 +01:00
pornhub.py generic extractor (#735) 2021-12-29 22:39:29 +01:00
pururin.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
reactor.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
readcomiconline.py update extractor test results 2022-07-12 15:49:22 +02:00
recursive.py remove 'extractor.blacklist' context manager 2020-09-11 13:17:35 +02:00
reddit.py [reddit] increase 'id-max' default value (#3397) 2022-12-12 12:10:06 +01:00
redgifs.py [redgifs] support v3 URLs 2023-01-30 20:06:43 +05:30
rule34us.py [rule34us] extract tags per category (#1527) 2021-12-16 00:06:52 +01:00
sankaku.py [sankaku] update URL pattern (#3523) 2023-01-18 21:38:01 +01:00
sankakucomplex.py implement 'util.unique_sequence()' 2021-03-02 23:11:08 +01:00
seiga.py [seiga] raise error when redirected to login page (#3401) 2022-12-17 12:52:17 +01:00
senmanga.py remove most 'yield Message.Version' statements 2021-08-16 03:10:48 +02:00
sexcom.py [sex.com] Download videos from cdn (#3408) 2022-12-16 10:16:40 +01:00
shopify.py [shopify] support ohpolly.com 2023-02-01 00:31:12 +05:30
simplyhentai.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
skeb.py [skeb] fix extraction (#3112) 2022-10-29 15:07:21 +02:00
slickpic.py update extractor test results 2022-12-08 18:58:29 +01:00
slideshare.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
smugmug.py update extractor test results 2022-12-08 18:58:29 +01:00
soundgasm.py [soundgasm] rewrite (#3578) 2023-02-15 16:52:07 +01:00
speakerdeck.py remove most 'yield Message.Version' statements 2021-08-16 03:10:48 +02:00
subscribestar.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
tapas.py update extractor test results 2022-08-28 00:16:12 +02:00
tcbscans.py [tcbscans] add 'chapter' and 'manga' extractors 2023-01-06 16:16:31 +05:30
telegraph.py [telegraph] fix extraction when images not in <figure> (#3590) 2023-01-31 22:14:44 +01:00
test.py remove most 'yield Message.Version' statements 2021-08-16 03:10:48 +02:00
toyhouse.py [toyhouse] support 'art' listings (#1546, #2331) 2022-02-27 16:22:50 +01:00
tsumino.py remove most 'yield Message.Version' statements 2021-08-16 03:10:48 +02:00
tumblr.py [tumblr] raise more detailed errors for dashboard-only blogs 2023-02-12 19:38:14 +01:00
tumblrgallery.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
twibooru.py update extractor test results 2022-12-08 18:58:29 +01:00
twitter.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
unsplash.py update extractor test results 2022-12-08 18:58:29 +01:00
uploadir.py [uploadir] use utf-8 filenames (#3162) 2022-11-05 19:03:48 +01:00
vanillarock.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
vichan.py [vichan] recognize board url w/o trailing slash (#3087) 2022-10-24 15:52:54 +02:00
vk.py fix 'keywords' in extractor tests (#3491) 2023-01-03 15:14:23 +01:00
vsco.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
wallhaven.py [wallhaven] update 'user' extractor (#3226) 2022-11-15 17:35:52 +01:00
wallpapercave.py [wallpapercave] add extractor for images (#2205) 2022-02-11 23:44:51 +01:00
warosu.py [warosu] fix and update 2022-12-07 21:23:45 +01:00
weasyl.py replace 'text.extract()' with 'text.extr()' where possible 2022-11-05 01:14:09 +01:00
webmshare.py [webmshare] add 'video' extractor (#2410) 2022-12-14 19:59:07 +01:00
webtoons.py update extractor test results 2022-12-08 18:58:29 +01:00
weibo.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
wikiart.py update extractor test results 2022-04-18 17:24:00 +02:00
wikifeet.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
xhamster.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
xvideos.py replace json.loads with direct calls to JSONDecoder.decode 2023-02-09 15:22:00 +01:00
ytdl.py refactor proxy handling code (#2357) 2022-03-10 23:55:35 +01:00
zerochan.py fix 'keywords' in extractor tests (#3491) 2023-01-03 15:14:23 +01:00