[extractor/generic] Properly extract format id from Content-Type

Fixes extraction for cases like: audio/x-mpegURL; charset=utf-8
2025-04-20 19:13:17 +00:00 · 2016-03-18 21:50:10 +06:00 · 2016-03-18 21:50:10 +06:00 · 263eff9537
commit 263eff9537
parent cae21032ab
1 changed files with 1 additions and 1 deletions
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -1249,7 +1249,7 @@ class GenericIE(InfoExtractor):

        # Check for direct link to a video
        content_type = head_response.headers.get('Content-Type', '')
-        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>.+)$', content_type)
+        m = re.match(r'^(?P<type>audio|video|application(?=/(?:ogg$|(?:vnd\.apple\.|x-)?mpegurl)))/(?P<format_id>[^;\s]+)', content_type)
        if m:
            upload_date = unified_strdate(
                head_response.headers.get('Last-Modified'))