rtvnh.py 1.3 KB

123456789101112131415161718192021222324252627282930313233343536
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. from .common import InfoExtractor
  4. class RTVNHIE(InfoExtractor):
  5. _VALID_URL = r'https?://(?:www\.)?rtvnh\.nl/video/(?P<id>[0-9]+)'
  6. _TEST = {
  7. 'url': 'http://www.rtvnh.nl/video/131946',
  8. 'md5': '6e1d0ab079e2a00b6161442d3ceacfc1',
  9. 'info_dict': {
  10. 'id': '131946',
  11. 'ext': 'mp4',
  12. 'title': 'Grote zoektocht in zee bij Zandvoort naar vermiste vrouw',
  13. 'thumbnail': 're:^https?:.*\.jpg$'
  14. }
  15. }
  16. def _real_extract(self, url):
  17. video_id = self._match_id(url)
  18. meta = self._parse_json(self._download_webpage('http://www.rtvnh.nl/video/json?m=' + video_id, video_id), video_id)
  19. formats = self._extract_smil_formats('http://www.rtvnh.nl/video/smil?m=' + video_id, video_id)
  20. for item in meta['source']['fb']:
  21. if item.get('type') == 'hls':
  22. formats.extend(self._extract_m3u8_formats(item['file'], video_id, ext='mp4', entry_protocol='m3u8_native'))
  23. elif item.get('type') == '':
  24. formats.append({'url': item['file']})
  25. return {
  26. 'id': video_id,
  27. 'title': meta['title'].strip(),
  28. 'thumbnail': meta['image'],
  29. 'formats': formats
  30. }