|
@@ -0,0 +1,114 @@
|
|
|
+from __future__ import unicode_literals
|
|
|
+
|
|
|
+import re
|
|
|
+import time
|
|
|
+
|
|
|
+from .common import InfoExtractor
|
|
|
+from ..utils import (
|
|
|
+ ExtractorError,
|
|
|
+ compat_urllib_request,
|
|
|
+ compat_urllib_parse,
|
|
|
+)
|
|
|
+
|
|
|
+
|
|
|
+class MooshareIE(InfoExtractor):
|
|
|
+ IE_NAME = 'mooshare'
|
|
|
+ IE_DESC = 'Mooshare.biz'
|
|
|
+ _VALID_URL = r'http://mooshare\.biz/(?P<id>[\da-z]{12})'
|
|
|
+
|
|
|
+ _TESTS = [
|
|
|
+ {
|
|
|
+ 'url': 'http://mooshare.biz/8dqtk4bjbp8g',
|
|
|
+ 'md5': '4e14f9562928aecd2e42c6f341c8feba',
|
|
|
+ 'info_dict': {
|
|
|
+ 'id': '8dqtk4bjbp8g',
|
|
|
+ 'ext': 'mp4',
|
|
|
+ 'title': 'Comedy Football 2011 - (part 1-2)',
|
|
|
+ 'duration': 893,
|
|
|
+ },
|
|
|
+ },
|
|
|
+ {
|
|
|
+ 'url': 'http://mooshare.biz/aipjtoc4g95j',
|
|
|
+ 'info_dict': {
|
|
|
+ 'id': 'aipjtoc4g95j',
|
|
|
+ 'ext': 'mp4',
|
|
|
+ 'title': 'Orange Caramel Dashing Through the Snow',
|
|
|
+ 'duration': 212,
|
|
|
+ },
|
|
|
+ 'params': {
|
|
|
+ # rtmp download
|
|
|
+ 'skip_download': True,
|
|
|
+ }
|
|
|
+ }
|
|
|
+ ]
|
|
|
+
|
|
|
+ def _real_extract(self, url):
|
|
|
+ mobj = re.match(self._VALID_URL, url)
|
|
|
+ video_id = mobj.group('id')
|
|
|
+
|
|
|
+ page = self._download_webpage(url, video_id, 'Downloading page')
|
|
|
+
|
|
|
+ if re.search(r'>Video Not Found or Deleted<', page) is not None:
|
|
|
+ raise ExtractorError(u'Video %s does not exist' % video_id, expected=True)
|
|
|
+
|
|
|
+ hash_key = self._html_search_regex(r'<input type="hidden" name="hash" value="([^"]+)">', page, 'hash')
|
|
|
+ title = self._html_search_regex(r'(?m)<div class="blockTitle">\s*<h2>Watch ([^<]+)</h2>', page, 'title')
|
|
|
+
|
|
|
+ download_form = {
|
|
|
+ 'op': 'download1',
|
|
|
+ 'id': video_id,
|
|
|
+ 'hash': hash_key,
|
|
|
+ }
|
|
|
+
|
|
|
+ request = compat_urllib_request.Request(
|
|
|
+ 'http://mooshare.biz/8dqtk4bjbp8g', compat_urllib_parse.urlencode(download_form))
|
|
|
+ request.add_header('Content-Type', 'application/x-www-form-urlencoded')
|
|
|
+
|
|
|
+ self.to_screen('%s: Waiting for timeout' % video_id)
|
|
|
+ time.sleep(5)
|
|
|
+
|
|
|
+ video_page = self._download_webpage(request, video_id, 'Downloading video page')
|
|
|
+
|
|
|
+ thumbnail = self._html_search_regex(r'image:\s*"([^"]+)",', video_page, 'thumbnail', fatal=False)
|
|
|
+ duration_str = self._html_search_regex(r'duration:\s*"(\d+)",', video_page, 'duration', fatal=False)
|
|
|
+ duration = int(duration_str) if duration_str is not None else None
|
|
|
+
|
|
|
+ formats = []
|
|
|
+
|
|
|
+ # SD video
|
|
|
+ mobj = re.search(r'(?m)file:\s*"(?P<url>[^"]+)",\s*provider:', video_page)
|
|
|
+ if mobj is not None:
|
|
|
+ formats.append({
|
|
|
+ 'url': mobj.group('url'),
|
|
|
+ 'format_id': 'sd',
|
|
|
+ 'format': 'SD',
|
|
|
+ })
|
|
|
+
|
|
|
+ # HD video
|
|
|
+ mobj = re.search(r'\'hd-2\': { file: \'(?P<url>[^\']+)\' },', video_page)
|
|
|
+ if mobj is not None:
|
|
|
+ formats.append({
|
|
|
+ 'url': mobj.group('url'),
|
|
|
+ 'format_id': 'hd',
|
|
|
+ 'format': 'HD',
|
|
|
+ })
|
|
|
+
|
|
|
+ # rtmp video
|
|
|
+ mobj = re.search(r'(?m)file: "(?P<playpath>[^"]+)",\s*streamer: "(?P<rtmpurl>rtmp://[^"]+)",', video_page)
|
|
|
+ if mobj is not None:
|
|
|
+ formats.append({
|
|
|
+ 'url': mobj.group('rtmpurl'),
|
|
|
+ 'play_path': mobj.group('playpath'),
|
|
|
+ 'rtmp_live': False,
|
|
|
+ 'ext': 'mp4',
|
|
|
+ 'format_id': 'rtmp',
|
|
|
+ 'format': 'HD',
|
|
|
+ })
|
|
|
+
|
|
|
+ return {
|
|
|
+ 'id': video_id,
|
|
|
+ 'title': title,
|
|
|
+ 'thumbnail': thumbnail,
|
|
|
+ 'duration': duration,
|
|
|
+ 'formats': formats,
|
|
|
+ }
|