You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
gallery-dl/gallery_dl/__init__.py

223 lines
6.9 KiB

# -*- coding: utf-8 -*-
# Copyright 2014-2017 Mike Fährmann
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License version 2 as
# published by the Free Software Foundation.
from __future__ import unicode_literals, print_function
__author__ = "Mike Fährmann"
__copyright__ = "Copyright 2014-2017 Mike Fährmann"
__license__ = "GPLv2"
10 years ago
__maintainer__ = "Mike Fährmann"
__email__ = "mike_faehrmann@web.de"
10 years ago
import sys
if sys.hexversion < 0x3030000:
print("Python 3.3+ required", file=sys.stderr)
sys.exit(1)
10 years ago
import argparse
import logging
import json
from . import config, extractor, job, exception
from .version import __version__
10 years ago
log = logging.getLogger("gallery-dl")
class ConfigAction(argparse.Action):
"""Set argparse results directly as config values"""
def __call__(self, parser, namespace, values, option_string=None):
config.set((self.dest,), values)
def build_cmdline_parser():
parser = argparse.ArgumentParser(
10 years ago
description='Download images from various sources')
parser.add_argument(
"-g", "--get-urls", dest="list_urls", action="count",
help="Print download urls",
)
parser.add_argument(
"-d", "--dest",
metavar="DEST", action=ConfigAction, dest="base-directory",
help="Destination directory",
)
parser.add_argument(
"-u", "--username",
metavar="USER", action=ConfigAction, dest="username",
)
parser.add_argument(
"-p", "--password",
metavar="PASS", action=ConfigAction, dest="password",
)
parser.add_argument(
"-i", "--input-file",
metavar="FILE", dest="inputfile",
help="Download URLs found in local FILE ('-' for stdin)",
)
parser.add_argument(
"--images",
metavar="ITEM-SPEC", action=ConfigAction, dest="images",
help=("Specify which images to download through a comma seperated list"
" of indices or index-ranges; "
"for example '--images -2,4,6-8,10-' will download images with "
"index 1, 2, 4, 6, 7, 8 and 10 up to the last one")
)
parser.add_argument(
"--chapters",
metavar="ITEM-SPEC", action=ConfigAction, dest="chapters",
help=("Same as '--images' except for chapters")
)
parser.add_argument(
"-R", "--retries",
metavar="RETRIES", action=ConfigAction, dest="retries", type=int,
help="Number of retries (default: 5)",
)
parser.add_argument(
"--http-timeout",
metavar="SECONDS", action=ConfigAction, dest="timeout", type=int,
help="Timeout for HTTP connections (defaut: no timeout)",
)
parser.add_argument(
"-c", "--config",
metavar="CFG", dest="cfgfiles", action="append",
help="Additional configuration files",
)
parser.add_argument(
"--config-yaml",
metavar="CFG", dest="yamlfiles", action="append",
help="Additional configuration files (YAML format)",
)
parser.add_argument(
"-o", "--option",
9 years ago
metavar="OPT", action="append", default=[],
help="Additional 'key=value' option values",
)
parser.add_argument(
"--list-extractors", dest="list_extractors", action="store_true",
help=("Print a list of extractor classes "
"with description and example URL"),
)
parser.add_argument(
"--list-keywords", dest="list_keywords", action="store_true",
help="Print a list of available keywords for the given URLs",
)
parser.add_argument(
"--list-modules", dest="list_modules", action="store_true",
help="Print a list of available modules/supported sites",
)
8 years ago
parser.add_argument(
"--version", action="version", version=__version__,
help="Print program version and exit"
8 years ago
)
parser.add_argument(
"urls",
nargs="*", metavar="URL",
help="Url to download images from"
)
return parser
10 years ago
def parse_option(opt):
try:
key, value = opt.split("=", 1)
try:
value = json.loads(value)
except ValueError:
pass
config.set(key.split("."), value)
except ValueError:
log.warning("Invalid 'key=value' pair: %s", opt)
def initialize_logging():
# convert levelnames to lowercase
for level in (10, 20, 30, 40, 50):
name = logging.getLevelName(level)
logging.addLevelName(level, name.lower())
# setup basic logging to stderr
formatter = logging.Formatter("[%(name)s][%(levelname)s] %(message)s")
handler = logging.StreamHandler()
handler.setFormatter(formatter)
root = logging.getLogger()
root.setLevel(logging.INFO)
root.addHandler(handler)
def sanatize_input(file):
for line in file:
line = line.strip()
if line:
yield line
10 years ago
def main():
try:
initialize_logging()
config.load()
parser = build_cmdline_parser()
args = parser.parse_args()
if args.cfgfiles:
config.load(*args.cfgfiles, strict=True)
if args.yamlfiles:
config.load(*args.yamlfiles, format="yaml", strict=True)
for opt in args.option:
parse_option(opt)
if args.list_modules:
for module_name in extractor.modules:
print(module_name)
elif args.list_extractors:
for extr in extractor.extractors():
print(extr.__name__)
if extr.__doc__:
print(extr.__doc__)
if hasattr(extr, "test") and extr.test:
print("Example:", extr.test[0][0])
print()
else:
if not args.urls and not args.inputfile:
parser.error("the following arguments are required: URL")
if args.list_urls:
jobtype = job.UrlJob
jobtype.maxdepth = args.list_urls
elif args.list_keywords:
jobtype = job.KeywordJob
else:
jobtype = job.DownloadJob
urls = args.urls
if args.inputfile:
try:
if args.inputfile == "-":
file = sys.stdin
else:
file = open(args.inputfile)
import itertools
urls = itertools.chain(urls, sanatize_input(file))
except OSError as err:
log.error(err)
for url in urls:
try:
jobtype(url).run()
except exception.NoExtractorError:
log.error("No suitable extractor found for '%s'", url)
except KeyboardInterrupt:
print("\nKeyboardInterrupt", file=sys.stderr)
except BrokenPipeError:
pass
except IOError as err:
import errno
if err.errno != errno.EPIPE:
raise