mirror of
https://github.com/mikf/gallery-dl.git
synced 2024-11-22 18:53:21 +01:00
102 lines
3.2 KiB
Python
102 lines
3.2 KiB
Python
# -*- coding: utf-8 -*-
|
|
|
|
# Copyright 2024 Mike Fährmann
|
|
#
|
|
# This program is free software; you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License version 2 as
|
|
# published by the Free Software Foundation.
|
|
|
|
"""Extractors for https://saint2.su/"""
|
|
|
|
from .lolisafe import LolisafeAlbumExtractor
|
|
from .. import text
|
|
|
|
# URL prefix shared by the extractor patterns in this module:
# an optional "http://" or "https://" scheme, the host name "saint"
# followed by any number of digits, and one of the TLDs .su, .pk or .to
BASE_PATTERN = r"(?:https?://)?saint\d*\.(?:su|pk|to)"
|
|
|
|
|
|
class SaintAlbumExtractor(LolisafeAlbumExtractor):
    """Extractor for saint albums"""
    category = "saint"
    root = "https://saint2.su"
    pattern = BASE_PATTERN + r"/a/([^/?#]+)"
    example = "https://saint2.su/a/ID"

    def fetch_album(self, album_id):
        """Request the album page for 'album_id' and scrape it

        Returns a '(files, metadata)' tuple. 'files' is a list with one
        dict per '/thumbs/' marker found in the page, 'metadata' is a
        dict with the album-level fields and the Referer header.
        """
        album_url = self.root + "/a/" + album_id
        response = self.request(album_url)

        # NOTE(review): 'extr' presumably continues searching after its
        # previous match, so the calls below must stay in this order
        extr = text.extract_from(response.text)

        # album metadata
        title = extr("<title>", "<")
        descr = extr('name="description" content="', '"')

        # one entry per thumbnail; stop at the first empty result
        files = []
        id2 = extr("/thumbs/", "-")
        while id2:
            date = text.parse_timestamp(extr("", "."))
            embed_id = extr("/embed/", '"')
            size = text.parse_int(extr('data="', '"'))
            play_arg = extr("onclick=\"play(", ")")
            file_url = text.unescape(play_arg.strip("\"'"))
            id_dl = extr("/d/", ")").rstrip("\"'")

            files.append({
                "id2": id2,
                "date": date,
                "id": embed_id,
                "size": size,
                "file": file_url,
                "id_dl": id_dl,
            })
            id2 = extr("/thumbs/", "-")

        # everything before the last " - " in the page title
        album_name = text.unescape(title.rpartition(" - ")[0])
        album_size = sum(entry["size"] for entry in files)
        description = text.unescape(descr)

        metadata = {
            "album_id": album_id,
            "album_name": album_name,
            "album_size": album_size,
            "description": description,
            "count": len(files),
            "_http_headers": {"Referer": response.url},
        }
        return files, metadata
|
|
|
|
|
|
class SaintMediaExtractor(SaintAlbumExtractor):
    """Extractor for saint media links"""
    subcategory = "media"
    directory_fmt = ("{category}",)
    pattern = BASE_PATTERN + r"(/(embe)?d/([^/?#]+))"
    example = "https://saint2.su/embed/ID"

    def fetch_album(self, album_id):
        """Scrape a single '/embed/' or '/d/' page

        Returns a '(files, metadata)' tuple holding exactly one file
        dict and placeholder album metadata. Any exception raised while
        requesting or parsing the page is logged and results in an
        empty '((), {})' return value instead.
        """
        try:
            # NOTE(review): presumably the match groups of 'pattern':
            # the URL path, "embe" (or None for /d/ links), and the ID
            path, is_embed, _ = self.groups

            response = self.request(self.root + path)
            extr = text.extract_from(response.text)

            if not is_embed:  # /d/
                file = {
                    "file": text.unescape(extr('<a href="', '"')),
                    "id_dl": album_id,
                    "name": album_id,
                    "filename": album_id,
                    "extension": "mp4",
                }
            else:
                # extraction calls are kept in their original order
                id2 = extr("/thumbs/", "-")
                date = text.parse_timestamp(extr("", "."))
                source = text.unescape(extr('<source src="', '"'))
                id_dl = extr("/d/", "'")
                file = {
                    "id": album_id,
                    "id2": id2,
                    "date": date,
                    "file": source,
                    "id_dl": id_dl,
                }

            file["_http_headers"] = {"Referer": response.url}
        except Exception as err:
            self.log.error("%s: %s", err.__class__.__name__, err)
            return (), {}

        # a single media link has no album; use placeholder values
        metadata = {
            "album_id": "",
            "album_name": "",
            "album_size": -1,
            "description": "",
            "count": 1,
        }
        return (file,), metadata
|