[facebook] Fix extraction (closes #12323)

Almost all videos now use the pagelet type 'permalink_video_pagelet'
This commit is contained in:
Yen Chi Hsuan 2017-03-02 20:49:39 +08:00
parent c9612c0487
commit 11bb6ad1a5
No known key found for this signature in database
GPG key ID: 7F902A182457CA23
2 changed files with 7 additions and 1 deletion

View file

@@ -1,3 +1,9 @@
version <unreleased>
Extractors
* [facebook] Fix extraction (#12323)
version 2017.02.28
Core

View file

@@ -303,7 +303,7 @@ def extract_video_data(instances):
if not video_data:
server_js_data = self._parse_json(
self._search_regex(
r'bigPipe\.onPageletArrive\(({.+?})\)\s*;\s*}\s*\)\s*,\s*["\']onPageletArrive\s+(?:stream_pagelet|pagelet_group_mall)',
r'bigPipe\.onPageletArrive\(({.+?})\)\s*;\s*}\s*\)\s*,\s*["\']onPageletArrive\s+(?:stream_pagelet|pagelet_group_mall|permalink_video_pagelet)',
webpage, 'js data', default='{}'),
video_id, transform_source=js_to_json, fatal=False)
if server_js_data: