mirror of
https://github.com/mikf/gallery-dl.git
synced 2024-11-22 02:32:33 +01:00
[toondex] add support
This commit is contained in:
parent
59cf4b3884
commit
4d784d1f6f
@ -859,6 +859,12 @@ Consider all listed sites to potentially be NSFW.
|
||||
<td>Galleries</td>
|
||||
<td></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td>ToonDex</td>
|
||||
<td>https://toondex.net/</td>
|
||||
<td>Chapters, Manga</td>
|
||||
<td></td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td>Toyhouse</td>
|
||||
<td>https://toyhou.se/</td>
|
||||
|
@ -154,6 +154,7 @@ modules = [
|
||||
"tcbscans",
|
||||
"telegraph",
|
||||
"tmohentai",
|
||||
"toondex",
|
||||
"toyhouse",
|
||||
"tsumino",
|
||||
"tumblr",
|
||||
|
120
gallery_dl/extractor/toondex.py
Normal file
120
gallery_dl/extractor/toondex.py
Normal file
@ -0,0 +1,120 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License version 2 as
|
||||
# published by the Free Software Foundation.
|
||||
|
||||
"""Extractors for https://toondex.net/"""
|
||||
|
||||
import re
|
||||
from .common import MangaExtractor, ChapterExtractor
|
||||
from .. import text
|
||||
|
||||
|
||||
BASE_PATTERN = r"(?:https?://)?toondex\.net"
|
||||
|
||||
|
||||
class ToondexBase:
|
||||
"""Base class for Toondex extractors"""
|
||||
|
||||
category = "toondex"
|
||||
root = "https://toondex.net/"
|
||||
|
||||
def get_title(self, page):
|
||||
"""Gets the title of the manga"""
|
||||
title = text.extr(page, "<title>", "</title>")
|
||||
title = text.unescape(title).strip()
|
||||
match = re.search(
|
||||
r"(?:Chapter \d+ \| |Chapter \d+\.\d+ \| |Read )"
|
||||
r"(.+)(?: - (Read Free Online Comics at )?ToonDex)",
|
||||
title,
|
||||
)
|
||||
if match:
|
||||
title = match.group(1)
|
||||
return title
|
||||
|
||||
|
||||
class ToondexChapterExtractor(ToondexBase, ChapterExtractor):
|
||||
"""Extractor for manga chapters from Toondex.net"""
|
||||
|
||||
subcategory = "chapter"
|
||||
directory_fmt = (
|
||||
"{category}",
|
||||
"{manga}",
|
||||
"Chapter-{chapter:03}{chapter_minor}",
|
||||
)
|
||||
archive_fmt = "{chapter:03}{chapter_minor}_{page}"
|
||||
pattern = BASE_PATTERN + r"/comics/([\w\d-]+)\/chapter-(\d+-[\d+]|\d+)/?"
|
||||
example = "https://toondex.net/comics/sex-stopwatch/chapter-1/"
|
||||
|
||||
def __init__(self, match):
|
||||
url = match.group(0)
|
||||
self.gid, self.chapter = match.groups()
|
||||
ChapterExtractor.__init__(self, match, url)
|
||||
|
||||
def metadata(self, page):
|
||||
chapter, sep, minor = self.chapter.partition("-")
|
||||
|
||||
data = {
|
||||
"manga": self.get_title(page),
|
||||
"manga_id": self.gid,
|
||||
"chapter": text.parse_int(chapter),
|
||||
"chapter_id": f"{self.gid}-chapter-{self.chapter}",
|
||||
"chapter_minor": sep + minor,
|
||||
}
|
||||
return data
|
||||
|
||||
def images(self, page):
|
||||
images = []
|
||||
first_img = text.extract(
|
||||
page, '<img\n \n src="', '"'
|
||||
)
|
||||
images.append((first_img[0], None))
|
||||
|
||||
for url in text.extract_iter(page, 'data-src="', '"'):
|
||||
images.append((url, None))
|
||||
|
||||
return images
|
||||
|
||||
|
||||
class ToondexMangaExtractor(ToondexBase, MangaExtractor):
|
||||
"""Extractor for manga from Toondex.net"""
|
||||
|
||||
subcategory = "manga"
|
||||
chapterclass = ToondexChapterExtractor
|
||||
pattern = BASE_PATTERN + r"/comics/([\w\d-]+)/?$"
|
||||
example = "https://Toondex.com/comics/sex-stopwatch"
|
||||
|
||||
def __init__(self, match):
|
||||
url, self.gid = match.group(0), match.group(1)
|
||||
MangaExtractor.__init__(self, match, url)
|
||||
|
||||
def chapters(self, page):
|
||||
chapters = set()
|
||||
|
||||
for chapter_id in text.extract_iter(
|
||||
page, f'href="/comics/{self.gid}/', '/"'
|
||||
):
|
||||
chapters.add(chapter_id)
|
||||
|
||||
title = self.get_title(page)
|
||||
results = []
|
||||
|
||||
for chapter_id in chapters:
|
||||
chapter, sep, minor = chapter_id[8:].partition("-")
|
||||
results.append(
|
||||
(
|
||||
f"{self.root}comics/{self.gid}/{chapter_id}",
|
||||
{
|
||||
"manga_id": self.gid,
|
||||
"chapter_id": chapter_id,
|
||||
"chapter": text.parse_int(chapter),
|
||||
"chapter_minor": sep + minor,
|
||||
"manga": title,
|
||||
"lang": "en",
|
||||
"language": "English",
|
||||
},
|
||||
)
|
||||
)
|
||||
|
||||
return results
|
@ -126,6 +126,7 @@ CATEGORY_MAP = {
|
||||
"tbib" : "The Big ImageBoard",
|
||||
"tcbscans" : "TCB Scans",
|
||||
"tco" : "Twitter t.co",
|
||||
"toondex" : "ToonDex",
|
||||
"tmohentai" : "TMOHentai",
|
||||
"thatpervert" : "ThatPervert",
|
||||
"thebarchive" : "The /b/ Archive",
|
||||
|
Loading…
Reference in New Issue
Block a user