keek.py 1.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142
  1. from __future__ import unicode_literals
  2. import re
  3. from .common import InfoExtractor
  4. class KeekIE(InfoExtractor):
  5. _VALID_URL = r'https?://(?:www\.)?keek\.com/keek/(?P<id>\w+)'
  6. IE_NAME = 'keek'
  7. _TEST = {
  8. 'url': 'https://www.keek.com/keek/NODfbab',
  9. 'md5': '9b0636f8c0f7614afa4ea5e4c6e57e83',
  10. 'info_dict': {
  11. 'id': 'NODfbab',
  12. 'ext': 'mp4',
  13. 'title': 'test chars: "\'/\\ä<>This is a test video for youtube-dl.For more information, contact phihag@phihag.de . - Video - Videos on Keek',
  14. 'description': 'test chars: "\'/\\ä<>This is a test video for youtube-dl.For more information, contact phihag@phihag.de .',
  15. 'uploader': 'ytdl',
  16. 'uploader_id': 'eGT5bab',
  17. },
  18. }
  19. def _real_extract(self, url):
  20. video_id = self._match_id(url)
  21. webpage = self._download_webpage(url, video_id)
  22. uploader = uploader_id = None
  23. matches = re.search(r'data-username="(?P<uploader>[^"]+)"[^>]*data-user-id="(?P<uploader_id>[^"]+)"', webpage)
  24. if matches:
  25. uploader, uploader_id = matches.groups()
  26. return {
  27. 'id': video_id,
  28. 'url': self._og_search_video_url(webpage),
  29. 'ext': 'mp4',
  30. 'title': self._og_search_title(webpage),
  31. 'description': self._og_search_description(webpage),
  32. 'thumbnail': self._og_search_thumbnail(webpage),
  33. 'uploader': uploader,
  34. 'uploader_id': uploader_id,
  35. }