Browse Source

[toypics] Fix extraction

vobe 8 years ago
parent
commit
77d682da9d
1 changed files with 8 additions and 7 deletions
  1. 8 7
      youtube_dl/extractor/toypics.py

+ 8 - 7
youtube_dl/extractor/toypics.py

@@ -24,15 +24,16 @@ class ToypicsIE(InfoExtractor):
         mobj = re.match(self._VALID_URL, url)
         mobj = re.match(self._VALID_URL, url)
         video_id = mobj.group('id')
         video_id = mobj.group('id')
         page = self._download_webpage(url, video_id)
         page = self._download_webpage(url, video_id)
-        video_url = self._html_search_regex(
-            r'src:\s+"(http://static[0-9]+\.toypics\.net/flvideo/[^"]+)"', page, 'video URL')
-        title = self._html_search_regex(
-            r'<title>Toypics - ([^<]+)</title>', page, 'title')
+        formats = self._parse_html5_media_entries(url, page, video_id)[0]['formats']
+        title = self._html_search_regex([
+            r'<h1[^>]+class=["\']view-video-title[^>]+>([^<]+)</h',
+            r'<title>([^<]+) - Toypics</title>',
+        ], page, 'title')
         username = self._html_search_regex(
         username = self._html_search_regex(
-            r'toypics.net/([^/"]+)" class="user-name">', page, 'username')
+            r'More videos from <strong>([^<]+)</strong>', page, 'username')
         return {
         return {
             'id': video_id,
             'id': video_id,
-            'url': video_url,
+            'formats': formats,
             'title': title,
             'title': title,
             'uploader': username,
             'uploader': username,
             'age_limit': 18,
             'age_limit': 18,
@@ -71,7 +72,7 @@ class ToypicsUserIE(InfoExtractor):
                 note='Downloading page %d/%d' % (n, page_count))
                 note='Downloading page %d/%d' % (n, page_count))
             urls.extend(
             urls.extend(
                 re.findall(
                 re.findall(
-                    r'<p class="video-entry-title">\s+<a href="(https?://videos.toypics.net/view/[^"]+)">',
+                    r'<div[^>]+class=["\']preview[^>]+>\s*<a[^>]+href="(https?://videos.toypics.net/view/[^"]+)"',
                     lpage))
                     lpage))
 
 
         return {
         return {