daum.py 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102
  1. # encoding: utf-8
  2. from __future__ import unicode_literals
  3. from .common import InfoExtractor
  4. from ..compat import compat_urllib_parse
  5. from ..utils import int_or_none
  6. class DaumIE(InfoExtractor):
  7. _VALID_URL = r'https?://(?:m\.)?tvpot\.daum\.net/v/(?P<id>[^?#&]+)'
  8. IE_NAME = 'daum.net'
  9. _TESTS = [{
  10. 'url': 'http://tvpot.daum.net/v/vab4dyeDBysyBssyukBUjBz',
  11. 'info_dict': {
  12. 'id': 'vab4dyeDBysyBssyukBUjBz',
  13. 'ext': 'mp4',
  14. 'title': '마크 헌트 vs 안토니오 실바',
  15. 'description': 'Mark Hunt vs Antonio Silva',
  16. 'upload_date': '20131217',
  17. 'duration': 2117,
  18. },
  19. }, {
  20. 'url': 'http://tvpot.daum.net/v/07dXWRka62Y%24',
  21. 'only_matching': True,
  22. }]
  23. def _real_extract(self, url):
  24. video_id = self._match_id(url)
  25. query = compat_urllib_parse.urlencode({'vid': video_id})
  26. info = self._download_xml(
  27. 'http://tvpot.daum.net/clip/ClipInfoXml.do?' + query, video_id,
  28. 'Downloading video info')
  29. movie_data = self._download_json(
  30. 'http://videofarm.daum.net/controller/api/closed/v1_2/IntegratedMovieData.json?' + query,
  31. video_id, 'Downloading video formats info')
  32. formats = []
  33. for format_el in movie_data['output_list']['output_list']:
  34. profile = format_el['profile']
  35. format_query = compat_urllib_parse.urlencode({
  36. 'vid': video_id,
  37. 'profile': profile,
  38. })
  39. url_doc = self._download_xml(
  40. 'http://videofarm.daum.net/controller/api/open/v1_2/MovieLocation.apixml?' + format_query,
  41. video_id, note='Downloading video data for %s format' % profile)
  42. format_url = url_doc.find('result/url').text
  43. formats.append({
  44. 'url': format_url,
  45. 'format_id': profile,
  46. 'width': int_or_none(format_el.get('width')),
  47. 'height': int_or_none(format_el.get('height')),
  48. 'filesize': int_or_none(format_el.get('filesize')),
  49. })
  50. self._sort_formats(formats)
  51. return {
  52. 'id': video_id,
  53. 'title': info.find('TITLE').text,
  54. 'formats': formats,
  55. 'thumbnail': info.find('THUMB_URL').text,
  56. 'description': info.find('CONTENTS').text,
  57. 'duration': int_or_none(info.find('DURATION').text),
  58. 'upload_date': info.find('REGDTTM').text[:8],
  59. }
  60. class DaumClipIE(InfoExtractor):
  61. _VALID_URL = r'https?://(?:m\.)?tvpot\.daum\.net/.*?clipid=(?P<id>\d+)'
  62. IE_NAME = 'daum.net'
  63. _TESTS = [{
  64. 'url': 'http://tvpot.daum.net/clip/ClipView.do?clipid=52554690',
  65. 'info_dict': {
  66. 'id': '52554690',
  67. 'ext': 'mp4',
  68. 'title': 'DOTA 2GETHER 시즌2 6회 - 2부',
  69. 'description': 'DOTA 2GETHER 시즌2 6회 - 2부',
  70. 'upload_date': '20130831',
  71. 'duration': 3868,
  72. 'view_count': int,
  73. },
  74. }]
  75. def _real_extract(self, url):
  76. video_id = self._match_id(url)
  77. clip_info = self._download_json('http://tvpot.daum.net/mypot/json/GetClipInfo.do?clipid=%s' % video_id, video_id)['clip_bean']
  78. return {
  79. '_type': 'url_transparent',
  80. 'id': video_id,
  81. 'url': 'http://tvpot.daum.net/v/%s' % clip_info['vid'],
  82. 'title': clip_info['title'],
  83. 'thumbnail': clip_info.get('thumb_url'),
  84. 'description': clip_info.get('contents'),
  85. 'duration': int_or_none(clip_info.get('duration')),
  86. 'upload_date': clip_info.get('up_date')[:8],
  87. 'view_count': int_or_none(clip_info.get('play_count')),
  88. 'ie_key': 'Daum',
  89. }