1
0
mirror of https://github.com/mikf/gallery-dl.git synced 2024-11-22 02:32:33 +01:00

[imagechest] Add new extractor for ImageChest (#750)

* [imagechest] Add new extractor for ImageChest

* [imagechest] Fix flake8 compliance issues
This commit is contained in:
Bepis 2020-05-19 03:02:56 +10:00 committed by GitHub
parent b7ebf51229
commit 7b5711ee04
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 68 additions and 0 deletions

View File

@ -48,6 +48,7 @@ modules = [
"hypnohub",
"idolcomplex",
"imagebam",
"imagechest",
"imagefap",
"imgbb",
"imgbox",

View File

@ -0,0 +1,66 @@
# -*- coding: utf-8 -*-
# Copyright 2014-2020 Leonid "Bepis" Pavel
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.
"""Extract images from galleries at https://imgchest.com/"""
from .common import GalleryExtractor
from .. import text, exception
import re
class ImagechestGalleryExtractor(GalleryExtractor):
    """Extractor for image galleries from imgchest.com"""
    category = "imagechest"
    root = "https://imgchest.com"
    # The single capture group is the 11-character alphanumeric gallery ID.
    pattern = r"(?:https?://)?(?:www\.)?imgchest\.com/p/([A-Za-z0-9]{11})"
    test = (
        ("https://imgchest.com/p/3na7kr3by8d", {
            "url": "f095b4f78c051e5a94e7c663814d1e8d4c93c1f7",
            "content": "076959e65be30249a2c651fbe6090dc30ba85193",
            "count": 3
        }),
    )

    def __init__(self, match):
        """Store the gallery ID captured by 'pattern' and build its URL"""
        self.gallery_id = match.group(1)
        url = self.root + "/p/" + self.gallery_id
        GalleryExtractor.__init__(self, match, url)

    def metadata(self, page):
        """Return a dict with general metadata

        The dict holds the gallery ID and the content of the page's
        'og:title' meta tag, stripped and passed through text.unescape().
        The title is an empty string if no such tag is found.

        Raises exception.NotFoundError if 'page' contains the site's
        "could not be found" message.
        """
        if "Sorry, but the page you requested could not be found." in page:
            raise exception.NotFoundError("gallery")

        title_match = re.search(
            r'<meta property="og:title" content="([^"]+)"/>',
            page)
        # re.search() returns None when the tag is missing or its content
        # is empty; use an empty title in that case instead of failing
        # with AttributeError on None.group().
        title = title_match.group(1).strip() if title_match else ""

        return {
            "gallery_id": self.gallery_id,
            "title": text.unescape(title)
        }

    def images(self, page):
        """Yield an (image-url, metadata)-tuple for each og:image meta tag

        The metadata of each tuple is the result of
        text.nameext_from_url() for that image URL.
        """
        image_urls = re.findall(
            r'<meta property="og:image" content="([^"]+)"/>',
            page)

        for imgurl in image_urls:
            yield imgurl, text.nameext_from_url(imgurl)

View File

@ -44,6 +44,7 @@ CATEGORY_MAP = {
"imagefap" : "ImageFap",
"imgbb" : "ImgBB",
"imgbox" : "imgbox",
"imagechest" : "ImageChest",
"imgth" : "imgth",
"imgur" : "imgur",
"jaiminisbox" : "Jaimini's Box",