浏览代码

[cspan] Fix extraction (fixes #8032)

Jaime Marquínez Ferrándiz 9 年之前
父节点
当前提交
6c6b8bd5cc
共有 1 个文件被更改,包括 6 次插入4 次删除
  1. 6 4
      youtube_dl/extractor/cspan.py

+ 6 - 4
youtube_dl/extractor/cspan.py

@@ -60,11 +60,13 @@ class CSpanIE(InfoExtractor):
         video_id = self._match_id(url)
         video_type = None
         webpage = self._download_webpage(url, video_id)
-        matches = re.search(r'data-(prog|clip)id=\'([0-9]+)\'', webpage)
-        if matches:
+        # We first look for clipid, because clipprog always appears before
+        patterns = [r'id=\'clip(%s)\'\s*value=\'([0-9]+)\'' % t for t in ('id', 'prog')]
+        results = list(filter(None, (re.search(p, webpage) for p in patterns)))
+        if results:
+            matches = results[0]
             video_type, video_id = matches.groups()
-            if video_type == 'prog':
-                video_type = 'program'
+            video_type = 'clip' if video_type == 'id' else 'program'
         else:
             senate_isvp_url = SenateISVPIE._search_iframe_url(webpage)
             if senate_isvp_url: