Browse Source

[cspan] Fix extraction (fixes #8032)

Jaime Marquínez Ferrándiz 9 năm trước cách đây
mục cha
commit
6c6b8bd5cc
1 tập tin đã thay đổi với 6 bổ sung4 xóa
  1. 6 4
      youtube_dl/extractor/cspan.py

+ 6 - 4
youtube_dl/extractor/cspan.py

@@ -60,11 +60,13 @@ class CSpanIE(InfoExtractor):
         video_id = self._match_id(url)
         video_type = None
         webpage = self._download_webpage(url, video_id)
-        matches = re.search(r'data-(prog|clip)id=\'([0-9]+)\'', webpage)
-        if matches:
+        # We first look for clipid, because clipprog always appears before
+        patterns = [r'id=\'clip(%s)\'\s*value=\'([0-9]+)\'' % t for t in ('id', 'prog')]
+        results = list(filter(None, (re.search(p, webpage) for p in patterns)))
+        if results:
+            matches = results[0]
             video_type, video_id = matches.groups()
-            if video_type == 'prog':
-                video_type = 'program'
+            video_type = 'clip' if video_type == 'id' else 'program'
         else:
             senate_isvp_url = SenateISVPIE._search_iframe_url(webpage)
             if senate_isvp_url: