11 years ago · 4349c07dd7
--- a/test/test_utils.py
+++ b/test/test_utils.py
@@ -376,6 +376,7 @@ class TestUtil(unittest.TestCase):
 
															         self.assertEqual(parse_filesize('2 MiB'), 2097152)
														
 
															         self.assertEqual(parse_filesize('5 GB'), 5000000000)
														
 
															         self.assertEqual(parse_filesize('1.2Tb'), 1200000000000)
														
 
															+        self.assertEqual(parse_filesize('1,24 KB'), 1240)
														
 
															 if __name__ == '__main__':
														
 
															     unittest.main()
														
--- a/youtube_dl/extractor/__init__.py
+++ b/youtube_dl/extractor/__init__.py
@@ -217,6 +217,7 @@ from .mdr import MDRIE
 
															 from .metacafe import MetacafeIE
														
 
															 from .metacritic import MetacriticIE
														
 
															 from .mgoon import MgoonIE
														
 
															+from .minhateca import MinhatecaIE
														
 
															 from .ministrygrid import MinistryGridIE
														
 
															 from .mit import TechTVMITIE, MITIE, OCWMITIE
														
 
															 from .mitele import MiTeleIE
														
--- a/youtube_dl/extractor/minhateca.py
+++ b/youtube_dl/extractor/minhateca.py
@@ -0,0 +1,71 @@
 
															+# coding: utf-8
														
 
															+from __future__ import unicode_literals
														
 
															+
														
 
															+from .common import InfoExtractor
														
 
															+from ..compat import (
														
 
															+    compat_urllib_parse,
														
 
															+    compat_urllib_request,
														
 
															+)
														
 
															+from ..utils import (
														
 
															+    int_or_none,
														
 
															+    parse_filesize,
														
 
															+)
														
 
															+
														
 
															+
														
 
															+class MinhatecaIE(InfoExtractor):
														
 
															+    _VALID_URL = r'https?://minhateca\.com\.br/[^?#]+,(?P<id>[0-9]+)\.'
														
 
															+    _TEST = {
														
 
															+        'url': 'http://minhateca.com.br/pereba/misc/youtube-dl+test+video,125848331.mp4(video)',
														
 
															+        'info_dict': {
														
 
															+            'id': '125848331',
														
 
															+            'ext': 'mp4',
														
 
															+            'title': 'youtube-dl test video',
														
 
															+            'thumbnail': 're:^https?://.*\.jpg$',
														
 
															+            'filesize_approx': 1530000,
														
 
															+            'duration': 9,
														
 
															+            'view_count': int,
														
 
															+        }
														
 
															+    }
														
 
															+
														
 
															+    def _real_extract(self, url):
														
 
															+        video_id = self._match_id(url)
														
 
															+        webpage = self._download_webpage(url, video_id)
														
 
															+
														
 
															+        token = self._html_search_regex(
														
 
															+            r'<input name="__RequestVerificationToken".*?value="([^"]+)"',
														
 
															+            webpage, 'request token')
														
 
															+        token_data = [
														
 
															+            ('fileId', video_id),
														
 
															+            ('__RequestVerificationToken', token),
														
 
															+        ]
														
 
															+        req = compat_urllib_request.Request(
														
 
															+            'http://minhateca.com.br/action/License/Download',
														
 
															+            data=compat_urllib_parse.urlencode(token_data))
														
 
															+        req.add_header('Content-Type', 'application/x-www-form-urlencoded')
														
 
															+        data = self._download_json(
														
 
															+            req, video_id, note='Downloading metadata')
														
 
															+
														
 
															+        video_url = data['redirectUrl']
														
 
															+        title_str = self._html_search_regex(
														
 
															+            r'<h1.*?>(.*?)</h1>', webpage, 'title')
														
 
															+        title, _, ext = title_str.rpartition('.')
														
 
															+        filesize_approx = parse_filesize(self._html_search_regex(
														
 
															+            r'<p class="fileSize">(.*?)</p>',
														
 
															+            webpage, 'file size approximation', fatal=False))
														
 
															+        duration = int_or_none(self._html_search_regex(
														
 
															+            r'(?s)<p class="fileLeng[ht][th]">.*?([0-9]+)\s*s',
														
 
															+            webpage, 'duration', fatal=False))
														
 
															+        view_count = int_or_none(self._html_search_regex(
														
 
															+            r'<p class="downloadsCounter">([0-9]+)</p>',
														
 
															+            webpage, 'view count', fatal=False))
														
 
															+
														
 
															+        return {
														
 
															+            'id': video_id,
														
 
															+            'url': video_url,
														
 
															+            'title': title,
														
 
															+            'ext': ext,
														
 
															+            'filesize_approx': filesize_approx,
														
 
															+            'duration': duration,
														
 
															+            'view_count': view_count,
														
 
															+            'thumbnail': self._og_search_thumbnail(webpage),
														
 
															+        }
														
--- a/youtube_dl/utils.py
+++ b/youtube_dl/utils.py
@@ -1090,11 +1090,14 @@ def parse_filesize(s):
 
															     }
														
 
															     units_re = '|'.join(re.escape(u) for u in _UNIT_TABLE)
														
 
															-    m = re.match(r'(?P<num>[0-9]+(?:\.[0-9]*)?)\s*(?P<unit>%s)' % units_re, s)
														
 
															+    m = re.match(
														
 
															+        r'(?P<num>[0-9]+(?:[,.][0-9]*)?)\s*(?P<unit>%s)' % units_re, s)
														
 
															     if not m:
														
 
															         return None
														
 
															-    return int(float(m.group('num')) * _UNIT_TABLE[m.group('unit')])
														
 
															+    num_str = m.group('num').replace(',', '.')
														
 
															+    mult = _UNIT_TABLE[m.group('unit')]
														
 
															+    return int(float(num_str) * mult)
														
 
															 def get_term_width():