# wimp.py
import base64
import re

from .common import InfoExtractor
  4. class WimpIE(InfoExtractor):
  5. _VALID_URL = r'(?:http://)?(?:www\.)?wimp\.com/([^/]+)/'
  6. def _real_extract(self, url):
  7. mobj = re.match(self._VALID_URL, url)
  8. video_id = mobj.group(1)
  9. webpage = self._download_webpage(url, video_id)
  10. title = self._search_regex('\<meta name\="description" content="(.+?)" \/\>',webpage, 'video title')
  11. thumbnail_url = self._search_regex('\<meta property\=\"og\:image" content\=\"(.+?)\" />',webpage,'video thumbnail')
  12. googleString = self._search_regex("googleCode = '(.*?)'", webpage,'file url')
  13. googleString = base64.b64decode(googleString)
  14. final_url = self._search_regex(b'","(.*?)"', googleString,'final video url')
  15. ext = final_url.split('.')[-1]
  16. return [{
  17. 'id': video_id,
  18. 'url': final_url,
  19. 'ext': ext,
  20. 'title': title,
  21. 'thumbnail': thumbnail_url,
  22. }]