streamcz.py 1.9 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364
  1. # -*- coding: utf-8 -*-
  2. from __future__ import unicode_literals
  3. import re
  4. import json
  5. from .common import InfoExtractor
  6. class StreamCZIE(InfoExtractor):
  7. _VALID_URL = r'https?://www\.stream\.cz/((?P<category>.+)/)?(?P<videogroup>.+)/(?P<videoid>.+)'
  8. _TESTS = [{
  9. 'url': 'http://www.stream.cz/peklonataliri/765767-ecka-pro-deti',
  10. 'md5': '6d3ca61a8d0633c9c542b92fcb936b0c',
  11. 'info_dict': {
  12. 'id': '765767',
  13. 'ext': 'mp4',
  14. 'title': 'Peklo na talíři: Éčka pro děti',
  15. 'description': 'md5:49ace0df986e95e331d0fe239d421519',
  16. 'thumbnail': 'http://im.stream.cz/episode/52961d7e19d423f8f06f0100',
  17. },
  18. },
  19. ]
  20. def _real_extract(self, url):
  21. mobj = re.match(self._VALID_URL, url)
  22. video_id = mobj.group('videoid')
  23. webpage = self._download_webpage(url, video_id)
  24. data = self._html_search_regex(r'Stream\.Data\.Episode\((.+?)\);', webpage, 'stream data')
  25. jsonData = json.loads(data)
  26. formats = []
  27. for video in jsonData['instances']:
  28. format_id = video['instances'][0]['quality']
  29. if format_id == '240p':
  30. quality = 0
  31. elif format_id == '360p':
  32. quality = 1
  33. elif format_id == '480p':
  34. quality = 2
  35. elif format_id == '720p':
  36. quality = 3
  37. formats.append({
  38. 'format_id': format_id,
  39. 'url': video['instances'][0]['source'],
  40. 'quality': quality,
  41. 'ext': 'mp4',
  42. })
  43. self._sort_formats(formats)
  44. return {
  45. 'id': str(jsonData['id']),
  46. 'title': self._og_search_title(webpage),
  47. 'thumbnail': jsonData['episode_image_original_url'].replace('//', 'http://'),
  48. 'formats': formats,
  49. 'description': self._og_search_description(webpage),
  50. }