Ver Fonte

[yahoo] Add another content id regex (closes #11088)

Sergey M․ há 9 anos atrás
pai
commit
f420902a3b
1 ficheiro alterado com 14 adições e 0 exclusões
  1. 14 0
      youtube_dl/extractor/yahoo.py

+ 14 - 0
youtube_dl/extractor/yahoo.py

@@ -201,6 +201,19 @@ class YahooIE(InfoExtractor):
             },
             },
             'skip': 'redirect to https://www.yahoo.com/music',
             'skip': 'redirect to https://www.yahoo.com/music',
         },
         },
+        {
+            # ytwnews://cavideo/
+            'url': 'https://tw.video.yahoo.com/movie-tw/單車天使-中文版預-092316541.html',
+            'info_dict': {
+                'id': 'ba133ff2-0793-3510-b636-59dfe9ff6cff',
+                'ext': 'mp4',
+                'title': '單車天使 - 中文版預',
+                'description': '中文版預',
+            },
+            'params': {
+                'skip_download': True,
+            },
+        },
     ]
     ]
 
 
     def _real_extract(self, url):
     def _real_extract(self, url):
@@ -270,6 +283,7 @@ class YahooIE(InfoExtractor):
                     r'%s[^}]*"ccm_id"\s*:\s*"([^"]+)"' % re.escape(page_id),
                     r'%s[^}]*"ccm_id"\s*:\s*"([^"]+)"' % re.escape(page_id),
                     r'<article[^>]data-uuid=["\']([^"\']+)',
                     r'<article[^>]data-uuid=["\']([^"\']+)',
                     r'yahoo://article/view\?.*\buuid=([^&"\']+)',
                     r'yahoo://article/view\?.*\buuid=([^&"\']+)',
+                    r'<meta[^<>]+["\']ytwnews://cavideo/(?:[^/]+/)+([\da-fA-F-]+)[&"\']',
                 ]
                 ]
                 video_id = self._search_regex(
                 video_id = self._search_regex(
                     CONTENT_ID_REGEXES, webpage, 'content ID')
                     CONTENT_ID_REGEXES, webpage, 'content ID')