shahid.py 2.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. from .common import InfoExtractor
  4. from ..utils import (
  5. js_to_json,
  6. ExtractorError,
  7. int_or_none
  8. )
  9. class ShahidIE(InfoExtractor):
  10. _VALID_URL = r'https?://shahid\.mbc\.net/ar/episode/(?P<id>\d+)/?'
  11. _TESTS = [
  12. {
  13. 'url': 'https://shahid.mbc.net/ar/episode/108084/%D8%AE%D9%88%D8%A7%D8%B7%D8%B1-%D8%A7%D9%84%D9%85%D9%88%D8%B3%D9%85-11-%D8%A7%D9%84%D8%AD%D9%84%D9%82%D8%A9-1.html',
  14. 'info_dict': {
  15. 'id': '108084',
  16. 'ext': 'm3u8',
  17. 'title': 'خواطر الموسم 11 الحلقة 1',
  18. 'description': 'بسم الله',
  19. 'duration': 1166,
  20. },
  21. 'params': {
  22. # m3u8 download
  23. 'skip_download': True,
  24. }
  25. },
  26. {
  27. # shahid plus subscriber only
  28. 'url': 'https://shahid.mbc.net/ar/series/90497/%D9%85%D8%B1%D8%A7%D9%8A%D8%A7-2011.html',
  29. 'only_matching': True
  30. }
  31. ]
  32. def _real_extract(self, url):
  33. video_id = self._match_id(url)
  34. webpage = self._download_webpage(url, video_id)
  35. player_info = ''
  36. for line in self._search_regex('var flashvars = ({[^}]+})', webpage, 'flashvars').splitlines():
  37. if '+' not in line and '(' not in line and ')' not in line:
  38. player_info += line
  39. player_info = self._parse_json(js_to_json(player_info), video_id)
  40. video_id = player_info['id']
  41. player_type = player_info['playerType']
  42. player_json_data = self._download_json(
  43. 'https://shahid.mbc.net/arContent/getPlayerContent-param-.id-' + video_id + '.type-' + player_info['type'] + '.html',
  44. video_id
  45. )['data']
  46. if 'url' in player_json_data:
  47. m3u8_url = player_json_data['url']
  48. else:
  49. for error in player_json_data['error'].values():
  50. raise ExtractorError(error)
  51. formats = self._extract_m3u8_formats(m3u8_url, video_id)
  52. video_info = self._download_json(
  53. player_info['url'] + '/' + player_type + '/' + video_id + '?apiKey=sh%40hid0nlin3&hash=b2wMCTHpSmyxGqQjJFOycRmLSex%2BBpTK%2Fooxy6vHaqs%3D',
  54. video_id
  55. )['data']
  56. if video_info.get('error'):
  57. for error in video_info['error']:
  58. raise ExtractorError(error)
  59. video_info = video_info[player_type]
  60. title = video_info['title']
  61. thumbnail = video_info.get('thumbnailUrl')
  62. categories = [category['name'] for category in video_info.get('genres')]
  63. description = video_info.get('description')
  64. duration = int_or_none(video_info.get('duration'))
  65. return {
  66. 'id': video_id,
  67. 'title': title,
  68. 'thumbnail': thumbnail,
  69. 'categories': categories,
  70. 'description': description,
  71. 'duration': duration,
  72. 'formats': formats,
  73. }