[faz] Use a regex for getting the description

The page cannot be parsed with the HTML parser on Python 2.6.
2024-11-21 20:46:36 -05:00 · 2013-10-27 14:18:55 +01:00 · 2013-10-27 14:18:55 +01:00 · af4d506eb3
commit af4d506eb3
parent 749a4fd2fd
1 changed file with 2 additions and 4 deletions
--- a/youtube_dl/extractor/faz.py
+++ b/youtube_dl/extractor/faz.py
@@ -5,8 +5,6 @@
 from .common import InfoExtractor
 from ..utils import (
    determine_ext,
-    clean_html,
-    get_element_by_attribute,
 )
@@ -47,12 +45,12 @@ def _real_extract(self, url):
                'format_id': code.lower(),
            })
-        descr_html = get_element_by_attribute('class', 'Content Copy', webpage)
+        descr = self._html_search_regex(r'<p class="Content Copy">(.*?)</p>', webpage, u'description')
        info = {
            'id': video_id,
            'title': self._og_search_title(webpage),
            'formats': formats,
-            'description': clean_html(descr_html),
+            'description': descr,
            'thumbnail': config.find('STILL/STILL_BIG').text,
        }
        # TODO: Remove when #980 has been merged