[cspan] Fix extraction (fixes #8032)

2024-11-21 20:46:36 -05:00 · 2015-12-28 13:48:10 +01:00 · 2015-12-28 13:48:10 +01:00 · 6c6b8bd5cc
commit 6c6b8bd5cc
parent 04e24906be
1 changed file with 6 additions and 4 deletions
--- a/youtube_dl/extractor/cspan.py
+++ b/youtube_dl/extractor/cspan.py
@@ -60,11 +60,13 @@ def _real_extract(self, url):
        video_id = self._match_id(url)
        video_type = None
        webpage = self._download_webpage(url, video_id)
-        matches = re.search(r'data-(prog|clip)id=\'([0-9]+)\'', webpage)
+        # We first look for clipid, because clipprog always appears before
-        if matches:
+        patterns = [r'id=\'clip(%s)\'\s*value=\'([0-9]+)\'' % t for t in ('id', 'prog')]
+        results = list(filter(None, (re.search(p, webpage) for p in patterns)))
+        if results:
+            matches = results[0]
            video_type, video_id = matches.groups()
-            if video_type == 'prog':
+            video_type = 'clip' if video_type == 'id' else 'program'
-                video_type = 'program'
        else:
            senate_isvp_url = SenateISVPIE._search_iframe_url(webpage)
            if senate_isvp_url: