mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-11-21 20:46:36 -05:00
250 lines
10 KiB
Python
250 lines
10 KiB
Python
# coding: utf-8
|
|
from __future__ import unicode_literals
|
|
|
|
import re
|
|
|
|
from .common import InfoExtractor
|
|
from ..compat import compat_str
|
|
from ..utils import (
|
|
int_or_none,
|
|
parse_resolution,
|
|
try_get,
|
|
unified_timestamp,
|
|
url_or_none,
|
|
urljoin,
|
|
)
|
|
|
|
|
|
class PeerTubeIE(InfoExtractor):
|
|
_INSTANCES_RE = r'''(?:
|
|
# Taken from https://instances.joinpeertube.org/instances
|
|
tube\.openalgeria\.org|
|
|
peertube\.pointsecu\.fr|
|
|
peertube\.nogafa\.org|
|
|
peertube\.pl|
|
|
megatube\.lilomoino\.fr|
|
|
peertube\.tamanoir\.foucry\.net|
|
|
peertube\.inapurna\.org|
|
|
peertube\.netzspielplatz\.de|
|
|
video\.deadsuperhero\.com|
|
|
peertube\.devosi\.org|
|
|
peertube\.1312\.media|
|
|
tube\.worldofhauru\.xyz|
|
|
tube\.bootlicker\.party|
|
|
skeptikon\.fr|
|
|
peertube\.geekshell\.fr|
|
|
tube\.opportunis\.me|
|
|
peertube\.peshane\.net|
|
|
video\.blueline\.mg|
|
|
tube\.homecomputing\.fr|
|
|
videos\.cloudfrancois\.fr|
|
|
peertube\.viviers-fibre\.net|
|
|
tube\.ouahpiti\.info|
|
|
video\.tedomum\.net|
|
|
video\.g3l\.org|
|
|
fontube\.fr|
|
|
peertube\.gaialabs\.ch|
|
|
peertube\.extremely\.online|
|
|
peertube\.public-infrastructure\.eu|
|
|
tube\.kher\.nl|
|
|
peertube\.qtg\.fr|
|
|
tube\.22decembre\.eu|
|
|
facegirl\.me|
|
|
video\.migennes\.net|
|
|
janny\.moe|
|
|
tube\.p2p\.legal|
|
|
video\.atlanti\.se|
|
|
troll\.tv|
|
|
peertube\.geekael\.fr|
|
|
vid\.leotindall\.com|
|
|
video\.anormallostpod\.ovh|
|
|
p-tube\.h3z\.jp|
|
|
tube\.darfweb\.eu|
|
|
videos\.iut-orsay\.fr|
|
|
peertube\.solidev\.net|
|
|
videos\.symphonie-of-code\.fr|
|
|
testtube\.ortg\.de|
|
|
videos\.cemea\.org|
|
|
peertube\.gwendalavir\.eu|
|
|
video\.passageenseine\.fr|
|
|
videos\.festivalparminous\.org|
|
|
peertube\.touhoppai\.moe|
|
|
peertube\.duckdns\.org|
|
|
sikke\.fi|
|
|
peertube\.mastodon\.host|
|
|
firedragonvideos\.com|
|
|
vidz\.dou\.bet|
|
|
peertube\.koehn\.com|
|
|
peer\.hostux\.social|
|
|
share\.tube|
|
|
peertube\.walkingmountains\.fr|
|
|
medias\.libox\.fr|
|
|
peertube\.moe|
|
|
peertube\.xyz|
|
|
jp\.peertube\.network|
|
|
videos\.benpro\.fr|
|
|
tube\.otter\.sh|
|
|
peertube\.angristan\.xyz|
|
|
peertube\.parleur\.net|
|
|
peer\.ecutsa\.fr|
|
|
peertube\.heraut\.eu|
|
|
peertube\.tifox\.fr|
|
|
peertube\.maly\.io|
|
|
vod\.mochi\.academy|
|
|
exode\.me|
|
|
coste\.video|
|
|
tube\.aquilenet\.fr|
|
|
peertube\.gegeweb\.eu|
|
|
framatube\.org|
|
|
thinkerview\.video|
|
|
tube\.conferences-gesticulees\.net|
|
|
peertube\.datagueule\.tv|
|
|
video\.lqdn\.fr|
|
|
meilleurtube\.delire\.party|
|
|
tube\.mochi\.academy|
|
|
peertube\.dav\.li|
|
|
media\.zat\.im|
|
|
pytu\.be|
|
|
peertube\.valvin\.fr|
|
|
peertube\.nsa\.ovh|
|
|
video\.colibris-outilslibres\.org|
|
|
video\.hispagatos\.org|
|
|
tube\.svnet\.fr|
|
|
peertube\.video|
|
|
videos\.lecygnenoir\.info|
|
|
peertube3\.cpy\.re|
|
|
peertube2\.cpy\.re|
|
|
videos\.tcit\.fr|
|
|
peertube\.cpy\.re
|
|
)'''
|
|
_UUID_RE = r'[\da-fA-F]{8}-[\da-fA-F]{4}-[\da-fA-F]{4}-[\da-fA-F]{4}-[\da-fA-F]{12}'
|
|
_VALID_URL = r'''(?x)
|
|
(?:
|
|
peertube:(?P<host>[^:]+):|
|
|
https?://(?P<host_2>%s)/(?:videos/(?:watch|embed)|api/v\d/videos)/
|
|
)
|
|
(?P<id>%s)
|
|
''' % (_INSTANCES_RE, _UUID_RE)
|
|
_TESTS = [{
|
|
'url': 'https://peertube.moe/videos/watch/2790feb0-8120-4e63-9af3-c943c69f5e6c',
|
|
'md5': '80f24ff364cc9d333529506a263e7feb',
|
|
'info_dict': {
|
|
'id': '2790feb0-8120-4e63-9af3-c943c69f5e6c',
|
|
'ext': 'mp4',
|
|
'title': 'wow',
|
|
'description': 'wow such video, so gif',
|
|
'thumbnail': r're:https?://.*\.(?:jpg|png)',
|
|
'timestamp': 1519297480,
|
|
'upload_date': '20180222',
|
|
'uploader': 'Luclu7',
|
|
'uploader_id': '7fc42640-efdb-4505-a45d-a15b1a5496f1',
|
|
'uploder_url': 'https://peertube.nsa.ovh/accounts/luclu7',
|
|
'license': 'Unknown',
|
|
'duration': 3,
|
|
'view_count': int,
|
|
'like_count': int,
|
|
'dislike_count': int,
|
|
'tags': list,
|
|
'categories': list,
|
|
}
|
|
}, {
|
|
'url': 'https://peertube.tamanoir.foucry.net/videos/watch/0b04f13d-1e18-4f1d-814e-4979aa7c9c44',
|
|
'only_matching': True,
|
|
}, {
|
|
# nsfw
|
|
'url': 'https://tube.22decembre.eu/videos/watch/9bb88cd3-9959-46d9-9ab9-33d2bb704c39',
|
|
'only_matching': True,
|
|
}, {
|
|
'url': 'https://tube.22decembre.eu/videos/embed/fed67262-6edb-4d1c-833b-daa9085c71d7',
|
|
'only_matching': True,
|
|
}, {
|
|
'url': 'https://tube.openalgeria.org/api/v1/videos/c1875674-97d0-4c94-a058-3f7e64c962e8',
|
|
'only_matching': True,
|
|
}, {
|
|
'url': 'peertube:video.blender.org:b37a5b9f-e6b5-415c-b700-04a5cd6ec205',
|
|
'only_matching': True,
|
|
}]
|
|
|
|
@staticmethod
|
|
def _extract_peertube_url(webpage, source_url):
|
|
mobj = re.match(
|
|
r'https?://(?P<host>[^/]+)/videos/(?:watch|embed)/(?P<id>%s)'
|
|
% PeerTubeIE._UUID_RE, source_url)
|
|
if mobj and any(p in webpage for p in (
|
|
'<title>PeerTube<',
|
|
'There will be other non JS-based clients to access PeerTube',
|
|
'>We are sorry but it seems that PeerTube is not compatible with your web browser.<')):
|
|
return 'peertube:%s:%s' % mobj.group('host', 'id')
|
|
|
|
@staticmethod
|
|
def _extract_urls(webpage, source_url):
|
|
entries = re.findall(
|
|
r'''(?x)<iframe[^>]+\bsrc=["\'](?P<url>(?:https?:)?//%s/videos/embed/%s)'''
|
|
% (PeerTubeIE._INSTANCES_RE, PeerTubeIE._UUID_RE), webpage)
|
|
if not entries:
|
|
peertube_url = PeerTubeIE._extract_peertube_url(webpage, source_url)
|
|
if peertube_url:
|
|
entries = [peertube_url]
|
|
return entries
|
|
|
|
def _real_extract(self, url):
|
|
mobj = re.match(self._VALID_URL, url)
|
|
host = mobj.group('host') or mobj.group('host_2')
|
|
video_id = mobj.group('id')
|
|
|
|
video = self._download_json(
|
|
'https://%s/api/v1/videos/%s' % (host, video_id), video_id)
|
|
|
|
title = video['name']
|
|
|
|
formats = []
|
|
for file_ in video['files']:
|
|
if not isinstance(file_, dict):
|
|
continue
|
|
file_url = url_or_none(file_.get('fileUrl'))
|
|
if not file_url:
|
|
continue
|
|
file_size = int_or_none(file_.get('size'))
|
|
format_id = try_get(
|
|
file_, lambda x: x['resolution']['label'], compat_str)
|
|
f = parse_resolution(format_id)
|
|
f.update({
|
|
'url': file_url,
|
|
'format_id': format_id,
|
|
'filesize': file_size,
|
|
})
|
|
formats.append(f)
|
|
self._sort_formats(formats)
|
|
|
|
def account_data(field):
|
|
return try_get(video, lambda x: x['account'][field], compat_str)
|
|
|
|
category = try_get(video, lambda x: x['category']['label'], compat_str)
|
|
categories = [category] if category else None
|
|
|
|
nsfw = video.get('nsfw')
|
|
if nsfw is bool:
|
|
age_limit = 18 if nsfw else 0
|
|
else:
|
|
age_limit = None
|
|
|
|
return {
|
|
'id': video_id,
|
|
'title': title,
|
|
'description': video.get('description'),
|
|
'thumbnail': urljoin(url, video.get('thumbnailPath')),
|
|
'timestamp': unified_timestamp(video.get('publishedAt')),
|
|
'uploader': account_data('displayName'),
|
|
'uploader_id': account_data('uuid'),
|
|
'uploder_url': account_data('url'),
|
|
'license': try_get(
|
|
video, lambda x: x['licence']['label'], compat_str),
|
|
'duration': int_or_none(video.get('duration')),
|
|
'view_count': int_or_none(video.get('views')),
|
|
'like_count': int_or_none(video.get('likes')),
|
|
'dislike_count': int_or_none(video.get('dislikes')),
|
|
'age_limit': age_limit,
|
|
'tags': try_get(video, lambda x: x['tags'], list),
|
|
'categories': categories,
|
|
'formats': formats,
|
|
}
|