release 2015.11.02

[utils] unified_strdate: Return None if the date format can't be recognized (fixes #7340 )
This issue was introduced with ae12bc3ebb, it returned 'None'.
2015-11-02 16:18:54 +01:00 · 2015-11-02 14:08:38 +01:00 · 2015-11-02 13:55:21 +01:00 · 2015-11-02 12:46:10 +01:00 · 2015-11-02 04:26:20 +06:00
5 changed files with 32 additions and 24 deletions
--- a/test/test_utils.py
+++ b/test/test_utils.py
@@ -236,6 +236,7 @@ class TestUtil(unittest.TestCase):
            unified_strdate('2/2/2015 6:47:40 PM', day_first=False),
            '20150202')
        self.assertEqual(unified_strdate('25-09-2014'), '20140925')
+        self.assertEqual(unified_strdate('UNKNOWN DATE FORMAT'), None)

    def test_find_xpath_attr(self):
        testxml = '''<root>
--- a/youtube_dl/extractor/mitele.py
+++ b/youtube_dl/extractor/mitele.py
@@ -1,7 +1,10 @@
 from __future__ import unicode_literals

 from .common import InfoExtractor
-from ..compat import compat_urllib_parse
+from ..compat import (
+    compat_urllib_parse,
+    compat_urlparse,
+)
 from ..utils import (
    encode_dict,
    get_element_by_attribute,
@@ -15,7 +18,7 @@ class MiTeleIE(InfoExtractor):

    _TESTS = [{
        'url': 'http://www.mitele.es/programas-tv/diario-de/la-redaccion/programa-144/',
-        'md5': '757b0b66cbd7e0a97226d7d3156cb3e9',
+        'md5': '0ff1a13aebb35d9bc14081ff633dd324',
        'info_dict': {
            'id': '0NF1jJnxS1Wu3pHrmvFyw2',
            'display_id': 'programa-144',
@@ -34,6 +37,7 @@ class MiTeleIE(InfoExtractor):

        config_url = self._search_regex(
            r'data-config\s*=\s*"([^"]+)"', webpage, 'data config url')
+        config_url = compat_urlparse.urljoin(url, config_url)

        config = self._download_json(
            config_url, display_id, 'Downloading config JSON')
--- a/youtube_dl/extractor/videofyme.py
+++ b/youtube_dl/extractor/videofyme.py
@@ -2,8 +2,8 @@ from __future__ import unicode_literals

 from .common import InfoExtractor
 from ..utils import (
-    find_xpath_attr,
    int_or_none,
+    parse_iso8601,
 )


@@ -18,33 +18,35 @@ class VideofyMeIE(InfoExtractor):
            'id': '1100701',
            'ext': 'mp4',
            'title': 'This is VideofyMe',
-            'description': None,
+            'description': '',
+            'upload_date': '20130326',
+            'timestamp': 1364288959,
            'uploader': 'VideofyMe',
            'uploader_id': 'thisisvideofyme',
            'view_count': int,
+            'likes': int,
+            'comment_count': int,
        },
-
    }

    def _real_extract(self, url):
        video_id = self._match_id(url)
-        config = self._download_xml('http://sunshine.videofy.me/?videoId=%s' % video_id,
-                                    video_id)
-        video = config.find('video')
-        sources = video.find('sources')
-        url_node = next(node for node in [find_xpath_attr(sources, 'source', 'id', 'HQ %s' % key)
-                                          for key in ['on', 'av', 'off']] if node is not None)
-        video_url = url_node.find('url').text
-        view_count = int_or_none(self._search_regex(
-            r'([0-9]+)', video.find('views').text, 'view count', fatal=False))
+
+        config = self._download_json('http://vf-player-info-loader.herokuapp.com/%s.json' % video_id, video_id)['videoinfo']
+
+        video = config.get('video')
+        blog = config.get('blog', {})

        return {
            'id': video_id,
-            'title': video.find('title').text,
-            'url': video_url,
-            'thumbnail': video.find('thumb').text,
-            'description': video.find('description').text,
-            'uploader': config.find('blog/name').text,
-            'uploader_id': video.find('identifier').text,
-            'view_count': view_count,
+            'title': video['title'],
+            'url': video['sources']['source']['url'],
+            'thumbnail': video.get('thumb'),
+            'description': video.get('description'),
+            'timestamp': parse_iso8601(video.get('date')),
+            'uploader': blog.get('name'),
+            'uploader_id': blog.get('identifier'),
+            'view_count': int_or_none(self._search_regex(r'([0-9]+)', video.get('views'), 'view count', fatal=False)),
+            'likes': int_or_none(video.get('likes')),
+            'comment_count': int_or_none(video.get('nrOfComments')),
        }
--- a/youtube_dl/utils.py
+++ b/youtube_dl/utils.py
@@ -366,7 +366,7 @@ def sanitize_path(s):
    if drive_or_unc:
        norm_path.pop(0)
    sanitized_path = [
-        path_part if path_part in ['.', '..'] else re.sub('(?:[/<>:"\\|\\\\?\\*]|\.$)', '#', path_part)
+        path_part if path_part in ['.', '..'] else re.sub('(?:[/<>:"\\|\\\\?\\*]|[\s.]$)', '#', path_part)
        for path_part in norm_path]
    if drive_or_unc:
        sanitized_path.insert(0, drive_or_unc + os.path.sep)
@@ -911,7 +911,8 @@ def unified_strdate(date_str, day_first=True):
        timetuple = email.utils.parsedate_tz(date_str)
        if timetuple:
            upload_date = datetime.datetime(*timetuple[:6]).strftime('%Y%m%d')
-    return compat_str(upload_date)
+    if upload_date is not None:
+        return compat_str(upload_date)


 def determine_ext(url, default_ext='unknown_video'):
--- a/youtube_dl/version.py
+++ b/youtube_dl/version.py
@@ -1,3 +1,3 @@
 from __future__ import unicode_literals

-__version__ = '2015.11.01'
+__version__ = '2015.11.02'
Author	SHA1	Message	Date
Philipp Hagemeister	a230068ff7	release 2015.11.02	2015-11-02 16:18:54 +01:00
Jaime Marquínez Ferrándiz	6a75040278	[utils] unified_strdate: Return None if the date format can't be recognized (fixes #7340 ) This issue was introduced with `ae12bc3ebb`, it returned 'None'.	2015-11-02 14:08:38 +01:00
remitamine	c514b0ec65	[videofy.me] fix info extraction Closes #7339.	2015-11-02 13:55:21 +01:00
Jaime Marquínez Ferrándiz	eb97f46e8b	[mitele] Fix extraction and update test checksum (fixes #7343 )	2015-11-02 12:46:10 +01:00
Sergey M․	c90d16cf36	[utils:sanitize_path] Disallow trailing whitespace in path segment (Closes #7332 )	2015-11-02 04:26:20 +06:00