release 2014.02.03.1

[generic] Add support for multiple brightcove URLs (Fixes #2283 )
[vimeo] Remove superfluous whitespace
2014-02-03 15:20:41 +01:00 · 2014-02-03 15:19:40 +01:00 · 2014-02-03 20:24:11 +07:00 · 2014-02-03 20:19:23 +07:00 · 2014-02-03 20:02:58 +07:00
6 changed files with 126 additions and 20 deletions
--- a/test/test_playlists.py
+++ b/test/test_playlists.py
@@ -34,6 +34,7 @@ from youtube_dl.extractor import (
    KhanAcademyIE,
    EveryonesMixtapeIE,
    RutubeChannelIE,
+    GenericIE,
 )


@@ -229,6 +230,16 @@ class TestPlaylists(unittest.TestCase):
        self.assertEqual(result['id'], '1409')
        self.assertTrue(len(result['entries']) >= 34)

+    def test_multiple_brightcove_videos(self):
+        # https://github.com/rg3/youtube-dl/issues/2283
+        dl = FakeYDL()
+        ie = GenericIE(dl)
+        result = ie.extract('http://www.newyorker.com/online/blogs/newsdesk/2014/01/always-never-nuclear-command-and-control.html')
+        self.assertIsPlaylist(result)
+        self.assertEqual(result['id'], 'always-never-nuclear-command-and-control')
+        self.assertEqual(result['title'], 'Always/Never: A Little-Seen Movie About Nuclear Command and Control : The New Yorker')
+        self.assertEqual(len(result['entries']), 3)
+

 if __name__ == '__main__':
    unittest.main()
--- a/test/test_subtitles.py
+++ b/test/test_subtitles.py
@@ -14,6 +14,7 @@ from youtube_dl.extractor import (
    YoutubeIE,
    DailymotionIE,
    TEDIE,
+    VimeoIE,
 )


@@ -223,5 +224,60 @@ class TestBlipTVSubtitles(BaseTestSubtitles):
        self.assertEqual(md5(subtitles['en']), '5b75c300af65fe4476dff79478bb93e4')


+class TestVimeoSubtitles(BaseTestSubtitles):
+    url = 'http://vimeo.com/76979871'
+    IE = VimeoIE
+
+    def test_no_writesubtitles(self):
+        subtitles = self.getSubtitles()
+        self.assertEqual(subtitles, None)
+
+    def test_subtitles(self):
+        self.DL.params['writesubtitles'] = True
+        subtitles = self.getSubtitles()
+        self.assertEqual(md5(subtitles['en']), '8062383cf4dec168fc40a088aa6d5888')
+
+    def test_subtitles_lang(self):
+        self.DL.params['writesubtitles'] = True
+        self.DL.params['subtitleslangs'] = ['fr']
+        subtitles = self.getSubtitles()
+        self.assertEqual(md5(subtitles['fr']), 'b6191146a6c5d3a452244d853fde6dc8')
+
+    def test_allsubtitles(self):
+        self.DL.params['writesubtitles'] = True
+        self.DL.params['allsubtitles'] = True
+        subtitles = self.getSubtitles()
+        self.assertEqual(set(subtitles.keys()), set(['de', 'en', 'es', 'fr']))
+
+    def test_list_subtitles(self):
+        self.DL.expect_warning(u'Automatic Captions not supported by this server')
+        self.DL.params['listsubtitles'] = True
+        info_dict = self.getInfoDict()
+        self.assertEqual(info_dict, None)
+
+    def test_automatic_captions(self):
+        self.DL.expect_warning(u'Automatic Captions not supported by this server')
+        self.DL.params['writeautomaticsub'] = True
+        self.DL.params['subtitleslang'] = ['en']
+        subtitles = self.getSubtitles()
+        self.assertTrue(len(subtitles.keys()) == 0)
+
+    def test_nosubtitles(self):
+        self.DL.expect_warning(u'video doesn\'t have subtitles')
+        self.url = 'http://vimeo.com/56015672'
+        self.DL.params['writesubtitles'] = True
+        self.DL.params['allsubtitles'] = True
+        subtitles = self.getSubtitles()
+        self.assertEqual(len(subtitles), 0)
+
+    def test_multiple_langs(self):
+        self.DL.params['writesubtitles'] = True
+        langs = ['es', 'fr', 'de']
+        self.DL.params['subtitleslangs'] = langs
+        subtitles = self.getSubtitles()
+        for lang in langs:
+            self.assertTrue(subtitles.get(lang) is not None, u'Subtitles for \'%s\' not extracted' % lang)
+
+
 if __name__ == '__main__':
    unittest.main()
--- a/youtube_dl/extractor/brightcove.py
+++ b/youtube_dl/extractor/brightcove.py
@@ -127,25 +127,28 @@ class BrightcoveIE(InfoExtractor):

    @classmethod
    def _extract_brightcove_url(cls, webpage):
-        """Try to extract the brightcove url from the wepbage, returns None
+        """Try to extract the brightcove url from the webpage, returns None
        if it can't be found
        """
+        urls = cls._extract_brightcove_urls(webpage)
+        return urls[0] if urls else None
+
+    @classmethod
+    def _extract_brightcove_urls(cls, webpage):
+        """Return a list of all Brightcove URLs from the webpage """

        url_m = re.search(r'<meta\s+property="og:video"\s+content="(http://c.brightcove.com/[^"]+)"', webpage)
        if url_m:
-            return url_m.group(1)
+            return [url_m.group(1)]

-        m_brightcove = re.search(
+        matches = re.findall(
            r'''(?sx)<object
            (?:
-                [^>]+?class=([\'"])[^>]*?BrightcoveExperience.*?\1 |
+                [^>]+?class=[\'"][^>]*?BrightcoveExperience.*?[\'"] |
                [^>]*?>\s*<param\s+name="movie"\s+value="https?://[^/]*brightcove\.com/
            ).+?</object>''',
            webpage)
-        if m_brightcove is not None:
-            return cls._build_brighcove_url(m_brightcove.group())
-        else:
-            return None
+        return [cls._build_brighcove_url(m) for m in matches]

    def _real_extract(self, url):
        url, smuggled_data = unsmuggle_url(url, {})
--- a/youtube_dl/extractor/generic.py
+++ b/youtube_dl/extractor/generic.py
@@ -234,11 +234,21 @@ class GenericIE(InfoExtractor):
            r'^(?:https?://)?([^/]*)/.*', url, 'video uploader')

        # Look for BrightCove:
-        bc_url = BrightcoveIE._extract_brightcove_url(webpage)
-        if bc_url is not None:
+        bc_urls = BrightcoveIE._extract_brightcove_urls(webpage)
+        if bc_urls:
            self.to_screen('Brightcove video detected.')
-            surl = smuggle_url(bc_url, {'Referer': url})
-            return self.url_result(surl, 'Brightcove')
+            entries = [{
+                '_type': 'url',
+                'url': smuggle_url(bc_url, {'Referer': url}),
+                'ie_key': 'Brightcove'
+            } for bc_url in bc_urls]
+
+            return {
+                '_type': 'playlist',
+                'title': video_title,
+                'id': video_id,
+                'entries': entries,
+            }

        # Look for embedded (iframe) Vimeo player
        mobj = re.search(
--- a/youtube_dl/extractor/vimeo.py
+++ b/youtube_dl/extractor/vimeo.py
@@ -6,10 +6,10 @@ import re
 import itertools

 from .common import InfoExtractor
+from .subtitles import SubtitlesInfoExtractor
 from ..utils import (
    compat_urllib_parse,
    compat_urllib_request,
-
    clean_html,
    get_element_by_attribute,
    ExtractorError,
@@ -19,7 +19,7 @@ from ..utils import (
 )


-class VimeoIE(InfoExtractor):
+class VimeoIE(SubtitlesInfoExtractor):
    """Information extractor for vimeo.com."""

    # _VALID_URL matches Vimeo URLs
@@ -84,6 +84,20 @@ class VimeoIE(InfoExtractor):
                'videopassword': 'youtube-dl',
            },
        },
+        {
+            'url': 'http://vimeo.com/76979871',
+            'md5': '3363dd6ffebe3784d56f4132317fd446',
+            'note': 'Video with subtitles',
+            'info_dict': {
+                'id': '76979871',
+                'ext': 'mp4',
+                'title': 'The New Vimeo Player (You Know, For Videos)',
+                'description': 'md5:2ec900bf97c3f389378a96aee11260ea',
+                'upload_date': '20131015',
+                'uploader_id': 'staff',
+                'uploader': 'Vimeo Staff',
+            }
+        },
    ]

    def _login(self):
@@ -273,19 +287,31 @@ class VimeoIE(InfoExtractor):
        if len(formats) == 0:
            raise ExtractorError('No known codec found')

+        subtitles = {}
+        text_tracks = config['request'].get('text_tracks')
+        if text_tracks:
+            for tt in text_tracks:
+                subtitles[tt['lang']] = 'http://vimeo.com' + tt['url']
+
+        video_subtitles = self.extract_subtitles(video_id, subtitles)
+        if self._downloader.params.get('listsubtitles', False):
+            self._list_available_subtitles(video_id, subtitles)
+            return
+
        return {
-            'id':       video_id,
+            'id': video_id,
            'uploader': video_uploader,
            'uploader_id': video_uploader_id,
-            'upload_date':  video_upload_date,
-            'title':    video_title,
-            'thumbnail':    video_thumbnail,
-            'description':  video_description,
+            'upload_date': video_upload_date,
+            'title': video_title,
+            'thumbnail': video_thumbnail,
+            'description': video_description,
            'formats': formats,
            'webpage_url': url,
            'view_count': view_count,
            'like_count': like_count,
            'comment_count': comment_count,
+            'subtitles': video_subtitles,
        }


--- a/youtube_dl/version.py
+++ b/youtube_dl/version.py
@@ -1,2 +1,2 @@

-__version__ = '2014.02.03'
+__version__ = '2014.02.03.1'
Author	SHA1	Message	Date
Philipp Hagemeister	90159f5561	release 2014.02.03.1	2014-02-03 15:20:41 +01:00
Philipp Hagemeister	99877772d0	[generic] Add support for multiple brightcove URLs (Fixes #2283 )	2014-02-03 15:19:40 +01:00
Sergey M.	b0268cb6ce	[vimeo] Remove superfluous whitespace	2014-02-03 20:24:11 +07:00
Sergey M.	4edff4cfa8	[vimeo] Add subtitle tests	2014-02-03 20:19:23 +07:00
Sergey M.	1eac553e7e	[vimeo] Add support for subtitles (Closes #2239 )	2014-02-03 20:02:58 +07:00