[youku] Fix list extraction (closes #15065)

Change-Id: I578fdc5b69509bdcd8d3191e3917afe47c234ff6
This commit is contained in:
JianxinLi 2017-12-24 00:30:27 +08:00 committed by Yen Chi Hsuan
parent a75419586b
commit d99a1000c7

View file

@@ -276,9 +276,9 @@ def _real_extract(self, url):
r'<div[^>]+id="(reload_\d+)', first_page, 'first page reload id') r'<div[^>]+id="(reload_\d+)', first_page, 'first page reload id')
# The first reload_id has the same items as first_page # The first reload_id has the same items as first_page
reload_ids = re.findall('<li[^>]+data-id="([^"]+)">', first_page) reload_ids = re.findall('<li[^>]+data-id="([^"]+)">', first_page)
entries.extend(initial_entries)
for idx, reload_id in enumerate(reload_ids): for idx, reload_id in enumerate(reload_ids):
if reload_id == first_page_reload_id: if reload_id == first_page_reload_id:
entries.extend(initial_entries)
continue continue
_, new_entries = self._extract_entries( _, new_entries = self._extract_entries(
'http://list.youku.com/show/episode', show_id, 'http://list.youku.com/show/episode', show_id,