Browse Source

[auengine] Simplify

Philipp Hagemeister 12 years ago
parent
commit
9906d397a0
1 changed files with 17 additions and 13 deletions
  1. 17 13
      youtube_dl/extractor/auengine.py

+ 17 - 13
youtube_dl/extractor/auengine.py

@@ -1,10 +1,10 @@
-import os.path
 import re
 import re
 
 
 from .common import InfoExtractor
 from .common import InfoExtractor
 from ..utils import (
 from ..utils import (
     compat_urllib_parse,
     compat_urllib_parse,
-    compat_urllib_parse_urlparse,
+    determine_ext,
+    ExtractorError,
 )
 )
 
 
 class AUEngineIE(InfoExtractor):
 class AUEngineIE(InfoExtractor):
@@ -25,22 +25,26 @@ class AUEngineIE(InfoExtractor):
         title = self._html_search_regex(r'<title>(?P<title>.+?)</title>',
         title = self._html_search_regex(r'<title>(?P<title>.+?)</title>',
                 webpage, u'title')
                 webpage, u'title')
         title = title.strip()
         title = title.strip()
-        links = re.findall(r'[^A-Za-z0-9]?(?:file|url):\s*["\'](http[^\'"&]*)', webpage)
-        links = [compat_urllib_parse.unquote(l) for l in links]
+        links = re.findall(r'\s(?:file|url):\s*["\']([^\'"]+)["\']', webpage)
+        links = map(compat_urllib_parse.unquote, links)
+
+        thumbnail = None
+        video_url = None
         for link in links:
         for link in links:
-            root, pathext = os.path.splitext(compat_urllib_parse_urlparse(link).path)
-            if pathext == '.png':
+            if link.endswith('.png'):
                 thumbnail = link
                 thumbnail = link
-            elif pathext == '.mp4':
-                url = link
-                ext = pathext
+            elif '/videos/' in link:
+                video_url = link
+        if not video_url:
+            raise ExtractorError(u'Could not find video URL')
+        ext = u'.' + determine_ext(video_url)
         if ext == title[-len(ext):]:
         if ext == title[-len(ext):]:
             title = title[:-len(ext)]
             title = title[:-len(ext)]
-        ext = ext[1:]
-        return [{
+
+        return {
             'id':        video_id,
             'id':        video_id,
-            'url':       url,
+            'url':       video_url,
             'ext':       ext,
             'ext':       ext,
             'title':     title,
             'title':     title,
             'thumbnail': thumbnail,
             'thumbnail': thumbnail,
-        }]
+        }