release 2013.10.23.2

[dailymotion] Extract all the available formats (closes #1028 )
[nowvideo] Fix key extraction
2013-10-23 18:38:09 +02:00 · 2013-10-23 17:33:38 +02:00 · 2013-10-23 17:00:33 +02:00 · 2013-10-23 16:32:17 +02:00 · 2013-10-23 16:31:53 +02:00 · 2013-10-23 15:12:33 +02:00
8 changed files with 79 additions and 30 deletions
--- a/youtube_dl/init.py
+++ b/youtube_dl/init.py
@@ -133,7 +133,7 @@ def parseOpts(overrideArguments=None):

    def _hide_login_info(opts):
        opts = list(opts)
-        for private_opt in ['-p', '--password', '-u', '--username']:
+        for private_opt in ['-p', '--password', '-u', '--username', '--video-password']:
            try:
                i = opts.index(private_opt)
                opts[i+1] = '<PRIVATE>'
--- a/youtube_dl/extractor/common.py
+++ b/youtube_dl/extractor/common.py
@@ -14,6 +14,7 @@ from ..utils import (
    clean_html,
    compiled_regex_type,
    ExtractorError,
+    RegexNotFoundError,
    unescapeHTML,
 )

@@ -231,7 +232,7 @@ class InfoExtractor(object):
        Perform a regex search on the given string, using a single or a list of
        patterns returning the first matching group.
        In case of failure return a default value or raise a WARNING or a
-        ExtractorError, depending on fatal, specifying the field name.
+        RegexNotFoundError, depending on fatal, specifying the field name.
        """
        if isinstance(pattern, (str, compat_str, compiled_regex_type)):
            mobj = re.search(pattern, string, flags)
@@ -251,7 +252,7 @@ class InfoExtractor(object):
        elif default is not None:
            return default
        elif fatal:
-            raise ExtractorError(u'Unable to extract %s' % _name)
+            raise RegexNotFoundError(u'Unable to extract %s' % _name)
        else:
            self._downloader.report_warning(u'unable to extract %s; '
                u'please report this issue on http://yt-dl.org/bug' % _name)
--- a/youtube_dl/extractor/dailymotion.py
+++ b/youtube_dl/extractor/dailymotion.py
@@ -28,6 +28,15 @@ class DailymotionIE(DailymotionBaseInfoExtractor, SubtitlesInfoExtractor):

    _VALID_URL = r'(?i)(?:https?://)?(?:www\.)?dailymotion\.[a-z]{2,3}/(?:embed/)?video/([^/]+)'
    IE_NAME = u'dailymotion'
+
+    _FORMATS = [  # (key looked up in `info`, format_id), lowest quality first
+        (u'stream_h264_ld_url', u'ld'),
+        (u'stream_h264_url', u'standard'),
+        (u'stream_h264_hq_url', u'hq'),
+        (u'stream_h264_hd_url', u'hd'),
+        (u'stream_h264_hd1080_url', u'hd1080'),  # was misspelled u'hd180'
+    ]
+
    _TESTS = [
        {
            u'url': u'http://www.dailymotion.com/video/x33vw9_tutoriel-de-youtubeur-dl-des-video_tech',
@@ -60,7 +69,6 @@ class DailymotionIE(DailymotionBaseInfoExtractor, SubtitlesInfoExtractor):

        video_id = mobj.group(1).split('_')[0].split('?')[0]

-        video_extension = 'mp4'
        url = 'http://www.dailymotion.com/video/%s' % video_id

        # Retrieve video webpage to extract further information
@@ -99,18 +107,24 @@ class DailymotionIE(DailymotionBaseInfoExtractor, SubtitlesInfoExtractor):
            msg = 'Couldn\'t get video, Dailymotion says: %s' % info['error']['title']
            raise ExtractorError(msg, expected=True)

-        # TODO: support choosing qualities
-
-        for key in ['stream_h264_hd1080_url','stream_h264_hd_url',
-                    'stream_h264_hq_url','stream_h264_url',
-                    'stream_h264_ld_url']:
-            if info.get(key):#key in info and info[key]:
-                max_quality = key
-                self.to_screen(u'Using %s' % key)
-                break
-        else:
+        formats = []
+        for (key, format_id) in self._FORMATS:
+            video_url = info.get(key)
+            if video_url is not None:
+                m_size = re.search(r'H264-(\d+)x(\d+)', video_url)
+                if m_size is not None:
+                    width, height = m_size.group(1), m_size.group(2)
+                else:
+                    width, height = None, None
+                formats.append({
+                    'url': video_url,
+                    'ext': 'mp4',
+                    'format_id': format_id,
+                    'width': width,
+                    'height': height,
+                })
+        if not formats:
            raise ExtractorError(u'Unable to extract video URL')
-        video_url = info[max_quality]

        # subtitles
        video_subtitles = self.extract_subtitles(video_id)
@@ -120,11 +134,10 @@ class DailymotionIE(DailymotionBaseInfoExtractor, SubtitlesInfoExtractor):

        return [{
            'id':       video_id,
-            'url':      video_url,
+            'formats': formats,
            'uploader': video_uploader,
            'upload_date':  video_upload_date,
            'title':    self._og_search_title(webpage),
-            'ext':      video_extension,
            'subtitles':    video_subtitles,
            'thumbnail': info['thumbnail_url']
        }]
--- a/youtube_dl/extractor/nowvideo.py
+++ b/youtube_dl/extractor/nowvideo.py
@@ -20,7 +20,10 @@ class NowVideoIE(InfoExtractor):

        video_id = mobj.group('id')
        webpage_url = 'http://www.nowvideo.ch/video/' + video_id
+        embed_url = 'http://embed.nowvideo.ch/embed.php?v=' + video_id
        webpage = self._download_webpage(webpage_url, video_id)
+        embed_page = self._download_webpage(embed_url, video_id,
+            u'Downloading embed page')

        self.report_extraction(video_id)

@@ -28,7 +31,7 @@ class NowVideoIE(InfoExtractor):
            webpage, u'video title')

        video_key = self._search_regex(r'var fkzd="(.*)";',
-            webpage, u'video key')
+            embed_page, u'video key')

        api_call = "http://www.nowvideo.ch/api/player.api.php?file={0}&numOfErrors=0&cid=1&key={1}".format(video_id, video_key)
        api_response = self._download_webpage(api_call, video_id,
--- a/youtube_dl/extractor/vimeo.py
+++ b/youtube_dl/extractor/vimeo.py
@@ -1,3 +1,4 @@
+# encoding: utf-8
 import json
 import re
 import itertools
@@ -10,6 +11,7 @@ from ..utils import (
    clean_html,
    get_element_by_attribute,
    ExtractorError,
+    RegexNotFoundError,
    std_headers,
    unsmuggle_url,
 )
@@ -25,7 +27,7 @@ class VimeoIE(InfoExtractor):
        {
            u'url': u'http://vimeo.com/56015672',
            u'file': u'56015672.mp4',
-            u'md5': u'8879b6cc097e987f02484baf890129e5',
+            u'md5': u'ae7a1d8b183758a0506b0622f37dfa14',
            u'info_dict': {
                u"upload_date": u"20121220", 
                u"description": u"This is a test case for youtube-dl.\nFor more information, see github.com/rg3/youtube-dl\nTest chars: \u2605 \" ' \u5e78 / \\ \u00e4 \u21ad \U0001d550", 
@@ -54,7 +56,22 @@ class VimeoIE(InfoExtractor):
                u'title': u'Kathy Sierra: Building the minimum Badass User, Business of Software',
                u'uploader': u'The BLN & Business of Software',
            },
-        }
+        },
+        {
+            u'url': u'http://vimeo.com/68375962',
+            u'file': u'68375962.mp4',
+            u'md5': u'aaf896bdb7ddd6476df50007a0ac0ae7',
+            u'note': u'Video protected with password',
+            u'info_dict': {
+                u'title': u'youtube-dl password protected test video',
+                u'upload_date': u'20130614',
+                u'uploader_id': u'user18948128',
+                u'uploader': u'Jaime Marquínez Ferrándiz',
+            },
+            u'params': {
+                u'videopassword': u'youtube-dl',
+            },
+        },
    ]

    def _login(self):
@@ -129,18 +146,26 @@ class VimeoIE(InfoExtractor):

        # Extract the config JSON
        try:
-            config = self._search_regex([r' = {config:({.+?}),assets:', r'c=({.+?);'],
-                webpage, u'info section', flags=re.DOTALL)
-            config = json.loads(config)
-        except:
+            try:
+                config_url = self._html_search_regex(
+                    r' data-config-url="(.+?)"', webpage, u'config URL')
+                config_json = self._download_webpage(config_url, video_id)
+                config = json.loads(config_json)
+            except RegexNotFoundError:
+                # For pro videos or player.vimeo.com urls
+                config = self._search_regex([r' = {config:({.+?}),assets:', r'c=({.+?);'],
+                    webpage, u'info section', flags=re.DOTALL)
+                config = json.loads(config)
+        except Exception as e:
            if re.search('The creator of this video has not given you permission to embed it on this domain.', webpage):
                raise ExtractorError(u'The author has restricted the access to this video, try with the "--referer" option')

-            if re.search('If so please provide the correct password.', webpage):
+            if re.search('<form[^>]+?id="pw_form"', webpage) is not None:
                self._verify_video_password(url, video_id, webpage)
                return self._real_extract(url)
            else:
-                raise ExtractorError(u'Unable to extract info section')
+                raise ExtractorError(u'Unable to extract info section',
+                                     cause=e)

        # Extract title
        video_title = config["video"]["title"]
--- a/youtube_dl/extractor/youtube.py
+++ b/youtube_dl/extractor/youtube.py
@@ -236,11 +236,13 @@ class YoutubeIE(YoutubeBaseInfoExtractor, SubtitlesInfoExtractor):
        '136': 'mp4',
        '137': 'mp4',
        '138': 'mp4',
-        '139': 'mp4',
-        '140': 'mp4',
-        '141': 'mp4',
        '160': 'mp4',

+        # Dash mp4 audio
+        '139': 'm4a',
+        '140': 'm4a',
+        '141': 'm4a',
+
        # Dash webm
        '171': 'webm',
        '172': 'webm',
--- a/youtube_dl/utils.py
+++ b/youtube_dl/utils.py
@@ -572,6 +572,11 @@ class ExtractorError(Exception):
        return u''.join(traceback.format_tb(self.traceback))


+class RegexNotFoundError(ExtractorError):
+    """Error when a regex didn't match"""
+    pass
+
+
 class DownloadError(Exception):
    """Download Error exception.

--- a/youtube_dl/version.py
+++ b/youtube_dl/version.py
@@ -1,2 +1,2 @@

-__version__ = '2013.10.23'
+__version__ = '2013.10.23.2'
Author	SHA1	Message	Date
Philipp Hagemeister	1cf64ee468	release 2013.10.23.2	2013-10-23 18:38:09 +02:00
Jaime Marquínez Ferrándiz	cdec0190c4	[dailymotion] Extract all the available formats (closes #1028 )	2013-10-23 17:33:38 +02:00
Jaime Marquínez Ferrándiz	2450bcb28b	[nowvideo] Fix key extraction Extract it from the embed page	2013-10-23 17:00:33 +02:00
Jaime Marquínez Ferrándiz	3126050c0f	Hide the video password on verbose mode	2013-10-23 16:32:17 +02:00
Jaime Marquínez Ferrándiz	93b22c7828	[vimeo] fix the extraction for videos protected with password Added a test video.	2013-10-23 16:31:53 +02:00
Philipp Hagemeister	0a89b2852e	release 2013.10.23.1	2013-10-23 15:12:33 +02:00
Jaime Marquínez Ferrándiz	55b3e45bba	[vimeo] Fix pro videos and player.vimeo.com urls The old process can still be used for those videos. Added RegexNotFoundError, which is raised by _search_regex if it can't extract the info.	2013-10-23 14:38:03 +02:00
Philipp Hagemeister	365bcf6d97	Merge remote-tracking branch 'origin/master'	2013-10-23 11:40:46 +02:00
Philipp Hagemeister	71907db3ba	[vimeo] Fix normal videos (Fixes #1642 ) Vimeo Pro Videos are still broken	2013-10-23 11:38:53 +02:00
Philipp Hagemeister	6803655ced	Merge pull request #1622 from rbrito/fix-extension extractor: youtube: Set extension of AAC audio formats to m4a.	2013-10-22 15:16:26 -07:00
Rogério Brito	f6f1fc9286	extractor: youtube: Fix extension of dash formats. While we are at it, separate the audio formats from the video formats. Signed-off-by: Rogério Brito <rbrito@ime.usp.br>	2013-10-18 18:53:00 -03:00
Rogério Brito	16f36a6fc9	extractor: youtube: Set extension of AAC audio formats to m4a. This, in particular, eases downloading both audio and videos in DASH formats before muxing them, which alleviates the problem that I exposed on issue Furthermore, one may argue that this is, indeed, the case for correctness's sake. Signed-off-by: Rogério Brito <rbrito@ime.usp.br>	2013-10-18 17:50:55 -03:00