2021-06-12 16:02:19 -04:00
|
|
|
import functools
|
2022-03-24 23:01:45 -04:00
|
|
|
import json
|
2015-04-08 11:40:31 -04:00
|
|
|
import os
|
|
|
|
|
2023-07-09 03:53:02 -04:00
|
|
|
from ..networking import Request
|
|
|
|
from ..networking.exceptions import HTTPError, network_exceptions
|
2015-04-08 11:40:31 -04:00
|
|
|
from ..utils import (
|
2022-04-11 18:32:57 -04:00
|
|
|
PostProcessingError,
|
2022-08-01 16:13:18 -04:00
|
|
|
RetryManager,
|
2021-08-23 17:45:44 -04:00
|
|
|
_configuration_args,
|
2022-08-30 11:28:28 -04:00
|
|
|
deprecation_warning,
|
2015-04-08 11:40:31 -04:00
|
|
|
encodeFilename,
|
|
|
|
)
|
2014-01-06 23:59:22 -05:00
|
|
|
|
|
|
|
|
2021-10-08 15:11:59 -04:00
|
|
|
class PostProcessorMetaClass(type):
    """Metaclass that instruments the ``run`` method of the classes it builds.

    Any class body that defines ``run`` gets that method replaced by a wrapper
    which fires the ``started`` and ``finished`` progress hooks around it.
    """

    @staticmethod
    def run_wrapper(func):
        """Wrap *func* so that progress hooks are notified before and after it.

        Both notifications receive the same copy of the info dict, taken
        before *func* is called. The value returned by *func* is passed
        through untouched.
        """

        @functools.wraps(func)
        def run(self, info, *args, **kwargs):
            snapshot = self._copy_infodict(info)
            self._hook_progress({'status': 'started'}, snapshot)

            result = func(self, info, *args, **kwargs)
            if result is not None:
                # Unpacking fails loudly unless the result holds exactly two
                # items; the rebound ``info`` is not used afterwards
                _files_to_delete, info = result

            self._hook_progress({'status': 'finished'}, snapshot)
            return result

        return run

    def __new__(cls, name, bases, attrs):
        """Create the class, wrapping ``run`` when the class body defines it."""
        try:
            declared_run = attrs['run']
        except KeyError:
            # ``run`` is inherited (or absent): nothing to wrap at this level
            pass
        else:
            attrs['run'] = cls.run_wrapper(declared_run)
        return type.__new__(cls, name, bases, attrs)
|
|
|
|
|
|
|
|
|
|
|
|
class PostProcessor(metaclass=PostProcessorMetaClass):
    """Base class for post processors.

    A downloader keeps a chain of PostProcessor objects, registered through
    its add_post_processor() method. After a successful download it calls
    run() on each of them in turn: the first one gets an initial argument,
    every following one gets the value returned by its predecessor.

    PostProcessor objects take part in a "mutual registration" process
    similar to the one used by InfoExtractor objects.

    A PostProcessor may optionally pick up a list of additional command-line
    arguments through self._configuration_args.
    """

    # Class-level fallback so the attribute exists before set_downloader() runs
    _downloader = None

    def __init__(self, downloader=None):
        """Set up the hook list, attach *downloader* and cache the PP name."""
        self._progress_hooks = []
        # The built-in reporter is registered first, ahead of any hooks
        # contributed by the downloader in set_downloader()
        self.add_progress_hook(self.report_progress)
        self.set_downloader(downloader)
        self.PP_NAME = self.pp_key()

    @classmethod
    def pp_key(cls):
        """Return the key of this post processor, derived from the class name.

        The last two characters of the class name are dropped, and so is a
        leading "ffmpeg" (matched case-insensitively).
        """
        stem = cls.__name__[:-2]
        if stem[:6].lower() == 'ffmpeg':
            return stem[6:]
        return stem

    def to_screen(self, text, prefix=True, *args, **kwargs):
        """Print *text* through the downloader, tagged with the PP name if *prefix*.

        Does nothing (and returns None) when no downloader is attached.
        """
        if not self._downloader:
            return None
        label = f'[{self.PP_NAME}] ' if prefix else ''
        return self._downloader.to_screen(f'{label}{text}', *args, **kwargs)

    def report_warning(self, text, *args, **kwargs):
        """Forward a warning to the downloader; no-op without a downloader."""
        if not self._downloader:
            return None
        return self._downloader.report_warning(text, *args, **kwargs)

    def deprecation_warning(self, msg):
        """Emit a deprecation warning.

        The downloader's own deprecation_warning is used when it has one,
        otherwise the module-level helper is called.
        """
        emit = getattr(self._downloader, 'deprecation_warning', deprecation_warning)
        return emit(msg, stacklevel=1)

    def deprecated_feature(self, msg):
        """Report use of a deprecated feature.

        Delegates to the downloader when one is attached and falls back to
        the module-level deprecation_warning otherwise.
        """
        if not self._downloader:
            return deprecation_warning(msg, stacklevel=1)
        return self._downloader.deprecated_feature(msg)

    def report_error(self, text, *args, **kwargs):
        """Deprecated: warn about the deprecation, then forward the error.

        The error itself is only forwarded when a downloader is attached.
        """
        self.deprecation_warning(
            '"yt_dlp.postprocessor.PostProcessor.report_error" is deprecated. '
            'raise "yt_dlp.utils.PostProcessingError" instead')
        if not self._downloader:
            return None
        return self._downloader.report_error(text, *args, **kwargs)

    def write_debug(self, text, *args, **kwargs):
        """Forward a debug message to the downloader; no-op without one."""
        if not self._downloader:
            return None
        return self._downloader.write_debug(text, *args, **kwargs)

    def _delete_downloaded_files(self, *files_to_delete, **kwargs):
        """Delete the given files.

        With a downloader attached the whole request is delegated to it.
        Without one, every distinct non-empty filename is removed directly
        and the keyword arguments are ignored.
        """
        if self._downloader:
            return self._downloader._delete_downloaded_files(*files_to_delete, **kwargs)
        unique_names = {name for name in files_to_delete if name}
        for name in unique_names:
            os.remove(name)

    def get_param(self, name, default=None, *args, **kwargs):
        """Look up *name* in the downloader's params, or return *default*.

        *default* is returned as-is when no downloader is attached.
        """
        if not self._downloader:
            return default
        return self._downloader.params.get(name, default, *args, **kwargs)

    def set_downloader(self, downloader):
        """Sets the downloader for this PP.

        Every hook found in the downloader's ``_postprocessor_hooks``
        attribute (if it has one) is registered as a progress hook.
        """
        self._downloader = downloader
        inherited_hooks = getattr(downloader, '_postprocessor_hooks', [])
        for hook in inherited_hooks:
            self.add_progress_hook(hook)

    def _copy_infodict(self, info_dict):
        """Copy *info_dict* with the downloader's copier, or ``dict`` as fallback."""
        copier = getattr(self._downloader, '_copy_infodict', dict)
        return copier(info_dict)

    @staticmethod
    def _restrict_to(*, video=True, audio=True, images=True, simulated=True):
        """Build a decorator that runs the wrapped method only for allowed inputs.

        The format type is "video" unless ``vcodec`` is 'none', else "audio"
        unless ``acodec`` is 'none', else "images". When the matching flag is
        false the wrapped method is skipped and ``([], info)`` is returned.
        With ``simulated=False`` the method is also skipped whenever the
        'simulate' or 'skip_download' param is set.
        """
        allowed = {'video': video, 'audio': audio, 'images': images}

        def decorator(func):
            @functools.wraps(func)
            def wrapper(self, info):
                skip_for_simulation = not simulated and (
                    self.get_param('simulate') or self.get_param('skip_download'))
                if skip_for_simulation:
                    return [], info

                if info.get('vcodec') != 'none':
                    format_type = 'video'
                elif info.get('acodec') != 'none':
                    format_type = 'audio'
                else:
                    format_type = 'images'

                if not allowed[format_type]:
                    self.to_screen(f'Skipping {format_type}')
                    return [], info
                return func(self, info)

            return wrapper

        return decorator

    def run(self, information):
        """Run the PostProcessor.

        "information" is a dictionary like the ones composed by
        InfoExtractors, with one extra field, "filepath", pointing to the
        downloaded file.

        Returns a tuple: a list of the files that can be deleted, followed
        by the updated information.

        May raise a PostProcessingError exception if post processing fails.
        """
        # Default implementation: keep the file and change nothing
        return [], information

    def try_utime(self, path, atime, mtime, errnote='Cannot update utime of file'):
        """Try to set the access/modification times of *path*.

        Any failure is reported as a warning carrying *errnote* instead of
        being raised.
        """
        try:
            os.utime(encodeFilename(path), (atime, mtime))
        except Exception:
            # Best effort only: a failed timestamp update must not abort processing
            self.report_warning(errnote)

    def _configuration_args(self, exe, *args, **kwargs):
        """Resolve the 'postprocessor_args' param for this PP and *exe*."""
        key = self.pp_key()
        configured = self.get_param('postprocessor_args')
        return _configuration_args(key, configured, exe, *args, **kwargs)

    def _hook_progress(self, status, info_dict):
        """Add context to *status* (in place) and pass it to every progress hook."""
        if not self._progress_hooks:
            return
        status.update(info_dict=info_dict, postprocessor=self.pp_key())
        for hook in self._progress_hooks:
            hook(status)

    def add_progress_hook(self, ph):
        """Register *ph* to be called with each progress status dict."""
        # See YoutubeDL.py (search for postprocessor_hooks) for a description of this interface
        self._progress_hooks.append(ph)

    def report_progress(self, s):
        """Default progress hook: print the status and update the console title.

        ``s['_default_template']`` is always filled in; output happens only
        when a downloader is attached.
        """
        s['_default_template'] = '%(postprocessor)s %(status)s' % s  # noqa: UP031
        if not self._downloader:
            return

        # Templates see the info dict under "info" and everything else under "progress"
        fields = s.copy()
        info = fields.pop('info_dict')
        payload = {'info': info, 'progress': fields}

        templates = self.get_param('progress_template', {})

        screen_tmpl = templates.get('postprocess')
        if screen_tmpl:
            rendered = self._downloader.evaluate_outtmpl(screen_tmpl, payload)
            self._downloader.to_screen(rendered, quiet=False)

        title_tmpl = templates.get('postprocess-title') or 'yt-dlp %(progress._default_template)s'
        self._downloader.to_console_title(self._downloader.evaluate_outtmpl(title_tmpl, payload))

    def _retry_download(self, err, count, retries):
        """Report a failed attempt through RetryManager.report_retry."""
        # While this is not an extractor, it behaves similar to one and
        # so obey extractor_retries and "--retry-sleep extractor"
        sleep_func = self.get_param('retry_sleep_functions', {}).get('extractor')
        RetryManager.report_retry(
            err, count, retries, info=self.to_screen, warn=self.report_warning, sleep_func=sleep_func)

    def _download_json(self, url, *, expected_http_errors=(404,)):
        """Fetch *url* through the downloader and return the decoded JSON.

        Returns None when the request fails with an HTTPError whose status
        is in *expected_http_errors*. Any other network error is recorded on
        the retry object as a PostProcessingError. The attempt budget comes
        from the 'extractor_retries' param (default 3).
        """
        self.write_debug(f'{self.PP_NAME} query: {url}')
        attempts = RetryManager(self.get_param('extractor_retries', 3), self._retry_download)
        for retry in attempts:
            try:
                rsp = self._downloader.urlopen(Request(url))
            except network_exceptions as e:
                if isinstance(e, HTTPError) and e.status in expected_http_errors:
                    return None
                retry.error = PostProcessingError(f'Unable to communicate with {self.PP_NAME} API: {e}')
                continue
        # Decode with the charset from the response headers, UTF-8 if none is given
        charset = rsp.headers.get_param('charset') or 'utf-8'
        return json.loads(rsp.read().decode(charset))
|
2022-03-24 23:01:45 -04:00
|
|
|
|
2014-01-06 23:59:22 -05:00
|
|
|
|
2022-06-06 12:19:57 -04:00
|
|
|
class AudioConversionError(PostProcessingError):
    """Deprecated subclass of PostProcessingError; adds no behaviour of its own."""
|