lcp.py 1.5 KB

123456789101112131415161718192021222324252627282930313233343536373839
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. from .common import InfoExtractor
  4. class LcpIE(InfoExtractor):
  5. IE_NAME = 'LCP'
  6. _VALID_URL = r'https?://(?:www\.)?lcp\.fr/(?:[^\/]+/)*(?P<id>[^/]+)'
  7. _TESTS = [{
  8. 'url': 'http://www.lcp.fr/la-politique-en-video/schwartzenberg-prg-preconise-francois-hollande-de-participer-une-primaire',
  9. 'md5': 'ab96c4dae94322ece1e98d97c8dc7807',
  10. 'info_dict': {
  11. 'id': 'd56d03e9',
  12. 'url': 're:http://httpod.scdn.arkena.com/11970/d56d03e9_.*',
  13. 'ext': 'mp4',
  14. 'title': 'd56d03e9',
  15. 'upload_date': '20160226',
  16. 'timestamp': 1456488895
  17. }
  18. }, {
  19. 'url': 'http://www.lcp.fr/le-direct',
  20. 'info_dict': {
  21. 'title': 'Le direct | LCP Assembl\xe9e nationale',
  22. 'id': 'le-direct',
  23. },
  24. 'playlist_mincount': 1
  25. }]
  26. def _real_extract(self, url):
  27. display_id = self._match_id(url)
  28. webpage = self._download_webpage(url, display_id)
  29. embed_url_regex = r'"(?P<url>(?:https?://(?:www\.)?)?play\.lcp\.fr/embed/[A-za-z0-9]+/[A-za-z0-9]+/[A-za-z0-9]+/[A-za-z0-9]+)"'
  30. embed_url = self._html_search_regex(embed_url_regex, webpage, 'player_url', default=None, fatal=False)
  31. if not embed_url:
  32. return self.url_result(url, 'Generic')
  33. title = self._og_search_title(webpage, default=None)
  34. return self.url_result(embed_url, 'ArkenaPlay', video_id=display_id, video_title=title)