(#1680, #878) Can be used by prefixing any URL with 'ytdl:', or by setting 'extractor,ytdl.enabled' to 'true'.pull/1700/head
parent
64240c8d42
commit
36ac2197db
@ -0,0 +1,101 @@
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
# Copyright 2021 Mike Fährmann
|
||||
#
|
||||
# This program is free software; you can redistribute it and/or modify
|
||||
# it under the terms of the GNU General Public License version 2 as
|
||||
# published by the Free Software Foundation.
|
||||
|
||||
"""Extractors for sites supported by youtube-dl"""
|
||||
|
||||
from .common import Extractor, Message
|
||||
from .. import config
|
||||
|
||||
|
||||
class YoutubeDLExtractor(Extractor):
|
||||
"""Generic extractor for youtube-dl supported URLs"""
|
||||
category = "ytdl"
|
||||
directory_fmt = ("{category}", "{subcategory}")
|
||||
filename_fmt = "{title}-{id}.{extension}"
|
||||
archive_fmt = "{extractor_key} {id}"
|
||||
ytdl_module = None
|
||||
pattern = r"ytdl:(.*)"
|
||||
test = ("ytdl:https://www.youtube.com/watch?v=BaW_jenozKc&t=1s&end=9",)
|
||||
|
||||
def __init__(self, match):
|
||||
# import youtube_dl module
|
||||
module = self.ytdl_module
|
||||
if not module:
|
||||
name = config.get(("extractor", "ytdl"), "module") or "youtube_dl"
|
||||
module = YoutubeDLExtractor.ytdl_module = __import__(name)
|
||||
|
||||
# find suitable youtube_dl extractor
|
||||
self.ytdl_url = url = match.group(1)
|
||||
for ie in module.extractor.gen_extractor_classes():
|
||||
if ie.suitable(url):
|
||||
self.ytdl_ie = ie
|
||||
break
|
||||
|
||||
# set subcategory to youtube_dl extractor's key
|
||||
self.subcategory = ie.ie_key()
|
||||
Extractor.__init__(self, match)
|
||||
|
||||
def items(self):
|
||||
# construct YoutubeDL object
|
||||
options = {
|
||||
"format": self.config("format"),
|
||||
"socket_timeout": self._timeout,
|
||||
"nocheckcertificate": not self._verify,
|
||||
"proxy": self.session.proxies.get("http"),
|
||||
}
|
||||
|
||||
raw_options = self.config("raw-options")
|
||||
if raw_options:
|
||||
options.update(raw_options)
|
||||
if self.config("logging", True):
|
||||
options["logger"] = self.log
|
||||
options["extract_flat"] = "in_playlist"
|
||||
|
||||
ytdl = self.ytdl_module.YoutubeDL(options)
|
||||
|
||||
# extract youtube_dl info_dict
|
||||
info_dict = ytdl._YoutubeDL__extract_info(
|
||||
self.ytdl_url,
|
||||
ytdl.get_info_extractor(self.ytdl_ie.ie_key()),
|
||||
False, {}, True)
|
||||
|
||||
if "entries" in info_dict:
|
||||
results = self._process_entries(ytdl, info_dict["entries"])
|
||||
else:
|
||||
results = (info_dict,)
|
||||
|
||||
# yield results
|
||||
for info_dict in results:
|
||||
info_dict["extension"] = None
|
||||
info_dict["_ytdl_info_dict"] = info_dict
|
||||
|
||||
url = "ytdl:" + (info_dict.get("url") or
|
||||
info_dict.get("webpage_url") or
|
||||
self.ytdl_url)
|
||||
|
||||
yield Message.Directory, info_dict
|
||||
yield Message.Url, url, info_dict
|
||||
|
||||
def _process_entries(self, ytdl, entries):
|
||||
for entry in entries:
|
||||
if entry.get("_type") in ("url", "url_transparent"):
|
||||
info_dict = ytdl.extract_info(
|
||||
entry["url"], False,
|
||||
ie_key=entry.get("ie_key"))
|
||||
if "entries" in info_dict:
|
||||
yield from self._process_entries(
|
||||
ytdl, info_dict["entries"])
|
||||
else:
|
||||
yield info_dict
|
||||
else:
|
||||
yield entry
|
||||
|
||||
|
||||
if config.get(("extractor", "ytdl"), "enabled"):
|
||||
# make 'ytdl:' prefix optional
|
||||
YoutubeDLExtractor.pattern = r"(?:ytdl:)?(.*)"
|
Loading…
Reference in new issue