keek.py 1.4 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. import re
  4. from .common import InfoExtractor
  5. class KeekIE(InfoExtractor):
  6. _VALID_URL = r'https?://(?:www\.)?keek\.com/keek/(?P<id>\w+)'
  7. IE_NAME = 'keek'
  8. _TEST = {
  9. 'url': 'https://www.keek.com/keek/NODfbab',
  10. 'md5': '9b0636f8c0f7614afa4ea5e4c6e57e83',
  11. 'info_dict': {
  12. 'id': 'NODfbab',
  13. 'ext': 'mp4',
  14. 'title': 'test chars: "\'/\\ä<>This is a test video for youtube-dl.For more information, contact phihag@phihag.de . - Video - Videos on Keek',
  15. 'description': 'md5:35d42050a3ece241d5ddd7fdcc6fd896',
  16. 'uploader': 'ytdl',
  17. 'uploader_id': 'eGT5bab',
  18. },
  19. }
  20. def _real_extract(self, url):
  21. video_id = self._match_id(url)
  22. webpage = self._download_webpage(url, video_id)
  23. uploader = uploader_id = None
  24. matches = re.search(r'data-username="(?P<uploader>[^"]+)"[^>]*data-user-id="(?P<uploader_id>[^"]+)"', webpage)
  25. if matches:
  26. uploader, uploader_id = matches.groups()
  27. return {
  28. 'id': video_id,
  29. 'url': self._og_search_video_url(webpage),
  30. 'ext': 'mp4',
  31. 'title': self._og_search_title(webpage),
  32. 'description': self._og_search_description(webpage),
  33. 'thumbnail': self._og_search_thumbnail(webpage),
  34. 'uploader': uploader,
  35. 'uploader_id': uploader_id,
  36. }