1
0
mirror of https://github.com/mikf/gallery-dl.git synced 2024-11-23 11:12:40 +01:00
gallery-dl/gallery_dl/extractor/urlshortener.py

53 lines
1.6 KiB
Python
Raw Normal View History

# -*- coding: utf-8 -*-
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.
2023-04-15 18:06:06 +02:00
"""Extractors for general-purpose URL shorteners"""
from .common import BaseExtractor, Message
from .. import exception
class UrlshortenerExtractor(BaseExtractor):
2023-04-15 18:06:06 +02:00
"""Base class for URL shortener extractors"""
basecategory = "urlshortener"
2023-04-15 18:06:06 +02:00
BASE_PATTERN = UrlshortenerExtractor.update({
2023-04-15 18:06:06 +02:00
"bitly": {
"root": "https://bit.ly",
"pattern": r"bit\.ly",
},
"tco": {
# t.co sends 'http-equiv="refresh"' (200) when using browser UA
"headers": {"User-Agent": None},
"root": "https://t.co",
"pattern": r"t\.co",
},
})
2023-04-15 18:06:06 +02:00
class UrlshortenerLinkExtractor(UrlshortenerExtractor):
"""Extractor for general-purpose URL shorteners"""
subcategory = "link"
pattern = BASE_PATTERN + r"/([^/?#]+)"
example = "https://bit.ly/abcde"
def __init__(self, match):
2023-04-15 18:06:06 +02:00
UrlshortenerExtractor.__init__(self, match)
2023-04-09 12:06:42 +02:00
self.id = match.group(match.lastindex)
def _init(self):
self.headers = self.config_instance("headers")
def items(self):
response = self.request(
2023-04-15 18:06:06 +02:00
"{}/{}".format(self.root, self.id), headers=self.headers,
method="HEAD", allow_redirects=False, notfound="URL")
try:
yield Message.Queue, response.headers["location"], {}
except KeyError:
raise exception.StopExtraction("Unable to resolve short URL")