ustudio.py 1.9 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758
  1. # coding: utf-8
  2. from __future__ import unicode_literals
  3. from .common import InfoExtractor
  4. from ..utils import int_or_none
  5. class UstudioIE(InfoExtractor):
  6. IE_NAME = 'uStudio'
  7. _VALID_URL = r'http://(?:www\.|v1\.)?ustudio.com/video/(?P<id>[\w\d]+)/.+'
  8. _TESTS = [
  9. {
  10. 'url': 'http://ustudio.com/video/Uxu2my9bgSph/san_francisco_golden_gate_bridge',
  11. 'md5': '58bbfca62125378742df01fc2abbdef6',
  12. 'info_dict': {
  13. 'id': 'Uxu2my9bgSph',
  14. 'ext': 'mp4',
  15. 'title': 'San Francisco: Golden Gate Bridge',
  16. 'thumbnail': 're:^https?://.*\.jpg$',
  17. 'description': 'md5:23925500697f2c6d4830e387ba51a9be',
  18. 'uploader': 'Tony Farley',
  19. }
  20. },
  21. ]
  22. def _real_extract(self, url):
  23. video_id = self._match_id(url)
  24. webpage = self._download_webpage(url, video_id)
  25. doc = self._download_xml(
  26. 'http://v1.ustudio.com/embed/{0}/ustudio/config.xml'.format(
  27. video_id),
  28. video_id,
  29. note='Downloading video info',
  30. errnote='Failed to download video info')
  31. formats = [
  32. {
  33. 'url': quality.attrib['url'],
  34. 'width': int_or_none(quality.attrib.get('width')),
  35. 'height': int_or_none(quality.attrib.get('height')),
  36. } for quality in doc.findall('./qualities/quality/video')
  37. ]
  38. self._sort_formats(formats)
  39. return {
  40. 'id': video_id,
  41. 'title': self._og_search_title(webpage),
  42. 'thumbnail': self._og_search_thumbnail(webpage),
  43. 'formats': formats,
  44. 'description': self._og_search_description(webpage),
  45. 'uploader': self._html_search_regex(
  46. r'<a href=".*/user/.+">(.+)</a> on',
  47. webpage,
  48. 'uploader',
  49. fatal=False),
  50. }