From b7a7319c388e3a33851d87b589586abb6796a0e5 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Sergey=20M=E2=80=A4?= Date: Thu, 1 Jan 2015 00:26:19 +0600 Subject: [PATCH] [slideshare] Fix extraction --- youtube_dl/extractor/slideshare.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/youtube_dl/extractor/slideshare.py b/youtube_dl/extractor/slideshare.py index e7d776e7b..9f79ff5c1 100644 --- a/youtube_dl/extractor/slideshare.py +++ b/youtube_dl/extractor/slideshare.py @@ -30,7 +30,7 @@ def _real_extract(self, url): page_title = mobj.group('title') webpage = self._download_webpage(url, page_title) slideshare_obj = self._search_regex( - r'var slideshare_object = ({.*?}); var user_info =', + r'var\s+slideshare_object\s*=\s*({.*?});\s*var\s+user_info\s*=', webpage, 'slideshare object') info = json.loads(slideshare_obj) if info['slideshow']['type'] != 'video': @@ -41,7 +41,7 @@ def _real_extract(self, url): ext = info['jsplayer']['video_extension'] video_url = compat_urlparse.urljoin(bucket, doc + '-SD.' + ext) description = self._html_search_regex( - r']*>(.*?)

', webpage, + r'(?s)<p[^>]+itemprop="description"[^>]*>(.+?)</p>', webpage, 'description', fatal=False) return {