|
@@ -1,56 +1,94 @@
|
|
from __future__ import unicode_literals
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
-import re
|
|
|
|
|
|
+import json
|
|
|
|
|
|
from .common import InfoExtractor
|
|
from .common import InfoExtractor
|
|
|
|
+from ..compat import (
|
|
|
|
+ compat_urllib_request,
|
|
|
|
+)
|
|
from ..utils import (
|
|
from ..utils import (
|
|
- compat_urllib_parse,
|
|
|
|
-
|
|
|
|
- unified_strdate,
|
|
|
|
|
|
+ int_or_none,
|
|
)
|
|
)
|
|
|
|
|
|
|
|
|
|
class PornotubeIE(InfoExtractor):
|
|
class PornotubeIE(InfoExtractor):
|
|
- _VALID_URL = r'https?://(?:\w+\.)?pornotube\.com(/c/(?P<channel>[0-9]+))?(/m/(?P<videoid>[0-9]+))(/(?P<title>.+))$'
|
|
|
|
|
|
+ _VALID_URL = r'https?://(?:\w+\.)?pornotube\.com/(?:[^?#]*?)/video/(?P<id>[0-9]+)'
|
|
_TEST = {
|
|
_TEST = {
|
|
- 'url': 'http://pornotube.com/c/173/m/1689755/Marilyn-Monroe-Bathing',
|
|
|
|
- 'md5': '374dd6dcedd24234453b295209aa69b6',
|
|
|
|
|
|
+ 'url': 'http://www.pornotube.com/orientation/straight/video/4964/title/weird-hot-and-wet-science',
|
|
|
|
+ 'md5': '60fc5a4f0d93a97968fc7999d98260c9',
|
|
'info_dict': {
|
|
'info_dict': {
|
|
- 'id': '1689755',
|
|
|
|
- 'ext': 'flv',
|
|
|
|
- 'upload_date': '20090708',
|
|
|
|
- 'title': 'Marilyn-Monroe-Bathing',
|
|
|
|
- 'age_limit': 18
|
|
|
|
|
|
+ 'id': '4964',
|
|
|
|
+ 'ext': 'mp4',
|
|
|
|
+ 'upload_date': '20141203',
|
|
|
|
+ 'title': 'Weird Hot and Wet Science',
|
|
|
|
+ 'description': 'md5:a8304bef7ef06cb4ab476ca6029b01b0',
|
|
|
|
+ 'categories': ['Adult Humor', 'Blondes'],
|
|
|
|
+ 'uploader': 'Alpha Blue Archives',
|
|
|
|
+ 'thumbnail': 're:^https?://.*\\.jpg$',
|
|
|
|
+ 'timestamp': 1417582800,
|
|
|
|
+ 'age_limit': 18,
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
def _real_extract(self, url):
|
|
def _real_extract(self, url):
|
|
- mobj = re.match(self._VALID_URL, url)
|
|
|
|
|
|
+ video_id = self._match_id(url)
|
|
|
|
|
|
- video_id = mobj.group('videoid')
|
|
|
|
- video_title = mobj.group('title')
|
|
|
|
|
|
+ # Fetch origin token
|
|
|
|
+ js_config = self._download_webpage(
|
|
|
|
+ 'http://www.pornotube.com/assets/src/app/config.js', video_id,
|
|
|
|
+ note='Download JS config')
|
|
|
|
+ originAuthenticationSpaceKey = self._search_regex(
|
|
|
|
+ r"constant\('originAuthenticationSpaceKey',\s*'([^']+)'",
|
|
|
|
+ js_config, 'originAuthenticationSpaceKey')
|
|
|
|
+
|
|
|
|
+ # Fetch actual token
|
|
|
|
+ token_req_data = {
|
|
|
|
+ 'authenticationSpaceKey': originAuthenticationSpaceKey,
|
|
|
|
+ 'credentials': 'Clip Application',
|
|
|
|
+ }
|
|
|
|
+ token_req = compat_urllib_request.Request(
|
|
|
|
+ 'https://api.aebn.net/auth/v1/token/primal',
|
|
|
|
+ data=json.dumps(token_req_data).encode('utf-8'))
|
|
|
|
+ token_req.add_header('Content-Type', 'application/json')
|
|
|
|
+ token_req.add_header('Origin', 'http://www.pornotube.com')
|
|
|
|
+ token_answer = self._download_json(
|
|
|
|
+ token_req, video_id, note='Requesting primal token')
|
|
|
|
+ token = token_answer['tokenKey']
|
|
|
|
|
|
- # Get webpage content
|
|
|
|
- webpage = self._download_webpage(url, video_id)
|
|
|
|
|
|
+ # Get video URL
|
|
|
|
+ delivery_req = compat_urllib_request.Request(
|
|
|
|
+ 'https://api.aebn.net/delivery/v1/clips/%s/MP4' % video_id)
|
|
|
|
+ delivery_req.add_header('Authorization', token)
|
|
|
|
+ delivery_info = self._download_json(
|
|
|
|
+ delivery_req, video_id, note='Downloading delivery information')
|
|
|
|
+ video_url = delivery_info['mediaUrl']
|
|
|
|
|
|
- # Get the video URL
|
|
|
|
- VIDEO_URL_RE = r'url: "(?P<url>http://video[0-9].pornotube.com/.+\.flv)",'
|
|
|
|
- video_url = self._search_regex(VIDEO_URL_RE, webpage, 'video url')
|
|
|
|
- video_url = compat_urllib_parse.unquote(video_url)
|
|
|
|
|
|
+ # Get additional info (title etc.)
|
|
|
|
+ info_req = compat_urllib_request.Request(
|
|
|
|
+ 'https://api.aebn.net/content/v1/clips/%s?expand='
|
|
|
|
+ 'title,description,primaryImageNumber,startSecond,endSecond,'
|
|
|
|
+ 'movie.title,movie.MovieId,movie.boxCoverFront,movie.stars,'
|
|
|
|
+ 'movie.studios,stars.name,studios.name,categories.name,'
|
|
|
|
+ 'clipActive,movieActive,publishDate,orientations' % video_id)
|
|
|
|
+ info_req.add_header('Authorization', token)
|
|
|
|
+ info = self._download_json(
|
|
|
|
+ info_req, video_id, note='Downloading metadata')
|
|
|
|
|
|
- # Get the uploaded date
|
|
|
|
- VIDEO_UPLOADED_RE = r'<div class="video_added_by">Added (?P<date>[0-9\/]+) by'
|
|
|
|
- upload_date = self._html_search_regex(VIDEO_UPLOADED_RE, webpage, 'upload date', fatal=False)
|
|
|
|
- if upload_date:
|
|
|
|
- upload_date = unified_strdate(upload_date)
|
|
|
|
- age_limit = self._rta_search(webpage)
|
|
|
|
|
|
+ timestamp = int_or_none(info.get('publishDate'), scale=1000)
|
|
|
|
+ uploader = info.get('studios', [{}])[0].get('name')
|
|
|
|
+ movie_id = info['movie']['movieId']
|
|
|
|
+ thumbnail = 'http://pic.aebn.net/dis/t/%s/%s_%08d.jpg' % (
|
|
|
|
+ movie_id, movie_id, info['primaryImageNumber'])
|
|
|
|
+ categories = [c['name'] for c in info.get('categories')]
|
|
|
|
|
|
return {
|
|
return {
|
|
'id': video_id,
|
|
'id': video_id,
|
|
'url': video_url,
|
|
'url': video_url,
|
|
- 'upload_date': upload_date,
|
|
|
|
- 'title': video_title,
|
|
|
|
- 'ext': 'flv',
|
|
|
|
- 'format': 'flv',
|
|
|
|
- 'age_limit': age_limit,
|
|
|
|
|
|
+ 'title': info['title'],
|
|
|
|
+ 'description': info.get('description'),
|
|
|
|
+ 'timestamp': timestamp,
|
|
|
|
+ 'uploader': uploader,
|
|
|
|
+ 'thumbnail': thumbnail,
|
|
|
|
+ 'categories': categories,
|
|
|
|
+ 'age_limit': 18,
|
|
}
|
|
}
|