mirror of
https://github.com/yt-dlp/yt-dlp.git
synced 2024-11-07 20:30:41 -05:00
[extractor/Scrolller] Add extractor (#4010)
Closes #3635 Authored by: LunarFang416
This commit is contained in:
parent
962ffcf89c
commit
2c60eae899
2 changed files with 105 additions and 0 deletions
|
@ -1511,6 +1511,7 @@
|
||||||
SCTEIE,
|
SCTEIE,
|
||||||
SCTECourseIE,
|
SCTECourseIE,
|
||||||
)
|
)
|
||||||
|
from .scrolller import ScrolllerIE
|
||||||
from .seeker import SeekerIE
|
from .seeker import SeekerIE
|
||||||
from .senategov import SenateISVPIE, SenateGovIE
|
from .senategov import SenateISVPIE, SenateGovIE
|
||||||
from .sendtonews import SendtoNewsIE
|
from .sendtonews import SendtoNewsIE
|
||||||
|
|
104
yt_dlp/extractor/scrolller.py
Normal file
104
yt_dlp/extractor/scrolller.py
Normal file
|
@ -0,0 +1,104 @@
|
||||||
|
import json
|
||||||
|
|
||||||
|
from .common import InfoExtractor
|
||||||
|
from ..utils import determine_ext, int_or_none
|
||||||
|
|
||||||
|
|
||||||
|
class ScrolllerIE(InfoExtractor):
|
||||||
|
_VALID_URL = r'https?://(?:www\.)?scrolller\.com/(?P<id>[\w-]+)'
|
||||||
|
_TESTS = [{
|
||||||
|
'url': 'https://scrolller.com/a-helping-hand-1k9pxikxkw',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'a-helping-hand-1k9pxikxkw',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'thumbnail': 'https://zepto.scrolller.com/a-helping-hand-3ty9q8x094-540x960.jpg',
|
||||||
|
'title': 'A helping hand',
|
||||||
|
'age_limit': 0,
|
||||||
|
}
|
||||||
|
}, {
|
||||||
|
'url': 'https://scrolller.com/tigers-chasing-a-drone-c5d1f2so6j',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'tigers-chasing-a-drone-c5d1f2so6j',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'thumbnail': 'https://zepto.scrolller.com/tigers-chasing-a-drone-az9pkpguwe-540x303.jpg',
|
||||||
|
'title': 'Tigers chasing a drone',
|
||||||
|
'age_limit': 0,
|
||||||
|
}
|
||||||
|
}, {
|
||||||
|
'url': 'https://scrolller.com/baby-rhino-smells-something-9chhugsv9p',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'baby-rhino-smells-something-9chhugsv9p',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'thumbnail': 'https://atto.scrolller.com/hmm-whats-that-smell-bh54mf2c52-300x224.jpg',
|
||||||
|
'title': 'Baby rhino smells something',
|
||||||
|
'age_limit': 0,
|
||||||
|
}
|
||||||
|
}, {
|
||||||
|
'url': 'https://scrolller.com/its-all-fun-and-games-cco8jjmoh7',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'its-all-fun-and-games-cco8jjmoh7',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'thumbnail': 'https://atto.scrolller.com/its-all-fun-and-games-3amk9vg7m3-540x649.jpg',
|
||||||
|
'title': 'It\'s all fun and games...',
|
||||||
|
'age_limit': 0,
|
||||||
|
}
|
||||||
|
}, {
|
||||||
|
'url': 'https://scrolller.com/may-the-force-be-with-you-octokuro-yeytg1fs7a',
|
||||||
|
'info_dict': {
|
||||||
|
'id': 'may-the-force-be-with-you-octokuro-yeytg1fs7a',
|
||||||
|
'ext': 'mp4',
|
||||||
|
'thumbnail': 'https://thumbs2.redgifs.com/DarkStarchyNautilus-poster.jpg',
|
||||||
|
'title': 'May the force be with you (Octokuro)',
|
||||||
|
'age_limit': 18,
|
||||||
|
}
|
||||||
|
}]
|
||||||
|
|
||||||
|
def _real_extract(self, url):
|
||||||
|
video_id = self._match_id(url)
|
||||||
|
|
||||||
|
query = {
|
||||||
|
'query': '''{
|
||||||
|
getSubredditPost(url:"/%s"){
|
||||||
|
id
|
||||||
|
title
|
||||||
|
isNsfw
|
||||||
|
mediaSources{
|
||||||
|
url
|
||||||
|
width
|
||||||
|
height
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}''' % video_id
|
||||||
|
}
|
||||||
|
|
||||||
|
video_data = self._download_json(
|
||||||
|
'https://api.scrolller.com/api/v2/graphql', video_id, data=json.dumps(query).encode(),
|
||||||
|
headers={'Content-Type': 'application/json'})['data']['getSubredditPost']
|
||||||
|
|
||||||
|
formats, thumbnails = [], []
|
||||||
|
for source in video_data['mediaSources']:
|
||||||
|
if determine_ext(source.get('url')) in ('jpg', 'png'):
|
||||||
|
thumbnails.append({
|
||||||
|
'url': source['url'],
|
||||||
|
'width': int_or_none(source.get('width')),
|
||||||
|
'height': int_or_none(source.get('height')),
|
||||||
|
})
|
||||||
|
elif source.get('url'):
|
||||||
|
formats.append({
|
||||||
|
'url': source['url'],
|
||||||
|
'width': int_or_none(source.get('width')),
|
||||||
|
'height': int_or_none(source.get('height')),
|
||||||
|
})
|
||||||
|
|
||||||
|
if not formats:
|
||||||
|
self.raise_no_formats('There is no video.', expected=True, video_id=video_id)
|
||||||
|
|
||||||
|
self._sort_formats(formats)
|
||||||
|
|
||||||
|
return {
|
||||||
|
'id': video_id,
|
||||||
|
'title': video_data.get('title'),
|
||||||
|
'thumbnails': thumbnails,
|
||||||
|
'formats': formats,
|
||||||
|
'age_limit': 18 if video_data.get('isNsfw') else 0
|
||||||
|
}
|
Loading…
Reference in a new issue