2017-03-23 16:29:40 +01:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
2018-01-27 01:05:17 +01:00
|
|
|
# Copyright 2017-2018 Mike Fährmann
|
2017-03-23 16:29:40 +01:00
|
|
|
#
|
|
|
|
# This program is free software; you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License version 2 as
|
|
|
|
# published by the Free Software Foundation.
|
|
|
|
|
|
|
|
"""Command line option parsing"""
|
|
|
|
|
|
|
|
import argparse
|
|
|
|
import logging
|
|
|
|
import json
|
|
|
|
from .version import __version__
|
|
|
|
|
|
|
|
|
|
|
|
class ConfigAction(argparse.Action):
|
|
|
|
"""Set argparse results as config values"""
|
|
|
|
def __call__(self, parser, namespace, values, option_string=None):
|
|
|
|
namespace.options.append(((self.dest,), values))
|
|
|
|
|
|
|
|
|
2017-05-03 15:17:08 +02:00
|
|
|
class ConfigConstAction(argparse.Action):
|
|
|
|
"""Set argparse const values as config values"""
|
|
|
|
def __call__(self, parser, namespace, values, option_string=None):
|
|
|
|
namespace.options.append(((self.dest,), self.const))
|
|
|
|
|
|
|
|
|
2017-03-23 16:29:40 +01:00
|
|
|
class ParseAction(argparse.Action):
|
|
|
|
"""Parse <key>=<value> options and set them as config values"""
|
|
|
|
def __call__(self, parser, namespace, values, option_string=None):
|
2018-01-27 01:05:17 +01:00
|
|
|
key, _, value = values.partition("=")
|
2017-03-23 16:29:40 +01:00
|
|
|
try:
|
2018-01-27 01:05:17 +01:00
|
|
|
value = json.loads(value)
|
2017-03-23 16:29:40 +01:00
|
|
|
except ValueError:
|
2018-01-27 01:05:17 +01:00
|
|
|
pass
|
|
|
|
key = key.split(".")
|
|
|
|
namespace.options.append((key, value))
|
2017-03-23 16:29:40 +01:00
|
|
|
|
|
|
|
|
|
|
|
class Formatter(argparse.HelpFormatter):
|
|
|
|
"""Custom HelpFormatter class to customize help output"""
|
|
|
|
def __init__(self, *args, **kwargs):
|
2017-03-23 16:51:42 +01:00
|
|
|
super().__init__(max_help_position=50, *args, **kwargs)
|
2017-03-23 16:29:40 +01:00
|
|
|
|
|
|
|
def _format_action_invocation(self, action):
|
|
|
|
opts = action.option_strings[:]
|
|
|
|
if opts:
|
|
|
|
if action.nargs != 0:
|
|
|
|
args_string = self._format_args(action, "ARG")
|
|
|
|
opts[-1] += " " + args_string
|
|
|
|
return ', '.join(opts)
|
|
|
|
else:
|
|
|
|
return self._metavar_formatter(action, action.dest)(1)[0]
|
|
|
|
|
|
|
|
|
|
|
|
def build_parser():
|
|
|
|
"""Build and configure an ArgumentParser object"""
|
|
|
|
parser = argparse.ArgumentParser(
|
|
|
|
usage="%(prog)s [OPTION]... URL...",
|
|
|
|
formatter_class=Formatter,
|
2017-08-16 19:56:50 +02:00
|
|
|
add_help=False,
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
|
|
|
general = parser.add_argument_group("General Options")
|
|
|
|
general.add_argument(
|
|
|
|
"-h", "--help",
|
|
|
|
action="help",
|
2017-09-30 18:52:23 +02:00
|
|
|
help="Print this help message and exit",
|
2017-08-16 19:56:50 +02:00
|
|
|
)
|
|
|
|
general.add_argument(
|
|
|
|
"--version",
|
|
|
|
action="version", version=__version__,
|
|
|
|
help="Print program version and exit",
|
|
|
|
)
|
|
|
|
general.add_argument(
|
2017-03-23 16:29:40 +01:00
|
|
|
"-d", "--dest",
|
|
|
|
metavar="DEST", action=ConfigAction, dest="base-directory",
|
|
|
|
help="Destination directory",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
general.add_argument(
|
|
|
|
"-i", "--input-file",
|
|
|
|
metavar="FILE", dest="inputfile",
|
|
|
|
help="Download URLs found in FILE ('-' for stdin)",
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
general.add_argument(
|
|
|
|
"--cookies",
|
|
|
|
metavar="FILE", action=ConfigAction, dest="cookies",
|
|
|
|
help="File to load additional cookies from",
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2018-02-19 18:24:56 +01:00
|
|
|
general.add_argument(
|
|
|
|
"--proxy",
|
|
|
|
metavar="URL", action=ConfigAction, dest="proxy",
|
|
|
|
help="Use the specified proxy",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
|
|
|
output = parser.add_argument_group("Output Options")
|
|
|
|
output.add_argument(
|
|
|
|
"-q", "--quiet", dest="loglevel", action="store_const",
|
|
|
|
const=logging.ERROR, default=logging.INFO,
|
|
|
|
help="Activate quiet mode",
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
output.add_argument(
|
|
|
|
"-v", "--verbose", dest="loglevel", action="store_const",
|
|
|
|
const=logging.DEBUG, default=logging.INFO,
|
|
|
|
help="Print various debugging information",
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
output.add_argument(
|
|
|
|
"-g", "--get-urls", dest="list_urls", action="count",
|
|
|
|
help="Print URLs instead of downloading",
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
output.add_argument(
|
|
|
|
"-j", "--dump-json", dest="list_data", action="store_true",
|
|
|
|
help="Print JSON information",
|
2017-05-03 15:17:08 +02:00
|
|
|
)
|
2017-09-09 18:48:28 +02:00
|
|
|
output.add_argument(
|
|
|
|
"-K", "--list-keywords", dest="list_keywords", action="store_true",
|
2017-09-30 18:52:23 +02:00
|
|
|
help=("Print a list of available keywords and example values "
|
|
|
|
"for the given URLs"),
|
2017-09-09 18:48:28 +02:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
output.add_argument(
|
|
|
|
"--list-modules", dest="list_modules", action="store_true",
|
|
|
|
help="Print a list of available extractor modules",
|
|
|
|
)
|
|
|
|
output.add_argument(
|
|
|
|
"--list-extractors", dest="list_extractors", action="store_true",
|
|
|
|
help=("Print a list of extractor classes "
|
|
|
|
"with description, (sub)category and example URL"),
|
|
|
|
)
|
2018-01-26 18:51:51 +01:00
|
|
|
output.add_argument(
|
|
|
|
"--write-log",
|
|
|
|
metavar="FILE", dest="logfile", action=ConfigAction,
|
|
|
|
help=("Write logging output to FILE"),
|
|
|
|
)
|
|
|
|
output.add_argument(
|
|
|
|
"--write-unsupported",
|
2018-01-28 18:42:10 +01:00
|
|
|
metavar="FILE", dest="unsupportedfile", action=ConfigAction,
|
2018-01-26 18:51:51 +01:00
|
|
|
help=("Write URLs, which get emitted by other extractors but cannot "
|
|
|
|
"be handled, to FILE"),
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
|
|
|
downloader = parser.add_argument_group("Downloader Options")
|
2017-12-02 01:47:26 +01:00
|
|
|
downloader.add_argument(
|
|
|
|
"-r", "--limit-rate",
|
|
|
|
metavar="RATE", action=ConfigAction, dest="rate",
|
|
|
|
help="Maximum download rate (e.g. 500k or 2.5M)",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
downloader.add_argument(
|
2017-03-23 16:29:40 +01:00
|
|
|
"-R", "--retries",
|
|
|
|
metavar="RETRIES", action=ConfigAction, dest="retries", type=int,
|
|
|
|
help="Number of retries (default: 5)",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
downloader.add_argument(
|
2017-03-23 16:29:40 +01:00
|
|
|
"--http-timeout",
|
2017-05-03 15:17:08 +02:00
|
|
|
metavar="SECONDS", action=ConfigAction, dest="timeout", type=float,
|
2017-12-05 23:29:11 +01:00
|
|
|
help="Timeout for HTTP connections (defaut: 30.0)",
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-12-04 17:06:17 +01:00
|
|
|
downloader.add_argument(
|
|
|
|
"--sleep",
|
|
|
|
metavar="SECONDS", action=ConfigAction, dest="sleep", type=float,
|
|
|
|
help="Number of seconds to sleep before each download",
|
|
|
|
)
|
2017-10-24 23:33:44 +02:00
|
|
|
downloader.add_argument(
|
|
|
|
"--no-part",
|
|
|
|
action=ConfigConstAction, nargs=0, dest="part", const=False,
|
|
|
|
help="Do not use .part files",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
downloader.add_argument(
|
|
|
|
"--abort-on-skip",
|
|
|
|
action=ConfigConstAction, nargs=0, dest="skip", const="abort",
|
|
|
|
help=("Abort extractor run if a file download would normally be "
|
2017-09-30 18:52:23 +02:00
|
|
|
"skipped, i.e. if a file with the same filename already exists"),
|
2017-07-03 15:02:19 +02:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
|
|
|
configuration = parser.add_argument_group("Configuration Options")
|
|
|
|
configuration.add_argument(
|
2017-03-23 16:29:40 +01:00
|
|
|
"-c", "--config",
|
|
|
|
metavar="CFG", dest="cfgfiles", action="append",
|
|
|
|
help="Additional configuration files",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
configuration.add_argument(
|
2017-03-23 16:29:40 +01:00
|
|
|
"--config-yaml",
|
|
|
|
metavar="CFG", dest="yamlfiles", action="append",
|
|
|
|
help="Additional configuration files (YAML format)",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
configuration.add_argument(
|
2017-04-25 17:09:10 +02:00
|
|
|
"--ignore-config", dest="load_config", action="store_false",
|
|
|
|
help="Do not read the default configuration files",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
configuration.add_argument(
|
2017-03-23 16:29:40 +01:00
|
|
|
"-o", "--option",
|
|
|
|
metavar="OPT", action=ParseAction, dest="options", default=[],
|
|
|
|
help="Additional '<key>=<value>' option values",
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
|
|
|
authentication = parser.add_argument_group("Authentication Options")
|
|
|
|
authentication.add_argument(
|
|
|
|
"-u", "--username",
|
|
|
|
metavar="USER", action=ConfigAction, dest="username",
|
2017-12-05 23:29:11 +01:00
|
|
|
help="A username to login with"
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
authentication.add_argument(
|
|
|
|
"-p", "--password",
|
|
|
|
metavar="PASS", action=ConfigAction, dest="password",
|
2017-12-05 23:29:11 +01:00
|
|
|
help="The password associated with the given username",
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
authentication.add_argument(
|
|
|
|
"--netrc",
|
|
|
|
action=ConfigConstAction, nargs=0, dest="netrc", const=True,
|
2017-12-05 23:29:11 +01:00
|
|
|
help="Enable .netrc authentication data",
|
2017-04-26 11:33:19 +02:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
|
|
|
selection = parser.add_argument_group("Selection Options")
|
2018-02-01 22:00:44 +01:00
|
|
|
selection.add_argument(
|
|
|
|
"--download-archive",
|
|
|
|
metavar="FILE", dest="archive", action=ConfigAction,
|
|
|
|
help=("Record all downloaded files in the archive file and "
|
|
|
|
"skip downloading any file already in it.")
|
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
selection.add_argument(
|
2017-09-23 17:31:40 +02:00
|
|
|
"--range",
|
|
|
|
metavar="RANGE", dest="image_range",
|
2017-08-16 19:56:50 +02:00
|
|
|
help=("Specify which images to download through a comma seperated list"
|
|
|
|
" of indices or index-ranges; "
|
2017-09-30 18:52:23 +02:00
|
|
|
"for example '--range -2,4,6-8,10-' will download images with "
|
2017-09-08 17:52:00 +02:00
|
|
|
"index 1, 2, 4, 6, 7, 8 and 10 up to the last one"),
|
2017-04-18 11:38:48 +02:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
selection.add_argument(
|
2017-09-23 17:31:40 +02:00
|
|
|
"--chapter-range",
|
|
|
|
metavar="RANGE", dest="chapter_range",
|
2017-09-30 18:52:23 +02:00
|
|
|
help=("Same as '--range' except for chapters "
|
2017-10-09 23:20:17 +02:00
|
|
|
"and other delegated URLs"),
|
2017-09-08 17:52:00 +02:00
|
|
|
)
|
|
|
|
selection.add_argument(
|
|
|
|
"--filter",
|
|
|
|
metavar="EXPR", dest="image_filter",
|
|
|
|
help=("Python expression controlling which images to download. Images "
|
|
|
|
"for which the expression evaluates to False are ignored. "
|
2017-12-05 23:29:11 +01:00
|
|
|
"Available keys are the filename-specific ones listed by '-K'. "
|
|
|
|
"Example: --filter \"image_width >= 1000 and "
|
2017-09-08 17:52:00 +02:00
|
|
|
"rating in ('s', 'q')\""),
|
|
|
|
)
|
|
|
|
selection.add_argument(
|
|
|
|
"--chapter-filter",
|
|
|
|
metavar="EXPR", dest="chapter_filter",
|
2017-09-30 18:52:23 +02:00
|
|
|
help=("Same as '--filter' except for chapters "
|
2017-10-09 23:20:17 +02:00
|
|
|
"and other delegated URLs"),
|
2017-09-23 17:31:40 +02:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
2017-03-23 16:29:40 +01:00
|
|
|
parser.add_argument(
|
|
|
|
"urls",
|
|
|
|
nargs="*", metavar="URL",
|
2017-08-16 19:56:50 +02:00
|
|
|
help=argparse.SUPPRESS,
|
2017-03-23 16:29:40 +01:00
|
|
|
)
|
2017-08-16 19:56:50 +02:00
|
|
|
|
2017-03-23 16:29:40 +01:00
|
|
|
return parser
|