2016-02-10 22:16:21 +01:00
# coding: utf-8
2016-08-25 22:22:31 +08:00
from __future__ import unicode_literals , division
2016-02-10 22:16:21 +01:00
from . common import InfoExtractor
from . . utils import int_or_none
class CrackleIE(InfoExtractor):
    """Information extractor for Crackle video pages and ``crackle:<id>`` URLs.

    Metadata is read from the legacy Crackle XML endpoints.  HLS formats are
    requested from Uplynk, and direct HTTP formats are derived from the
    item's media path combined with the fixed file names listed in
    ``_MEDIA_FILE_SLOTS``.
    """

    _VALID_URL = r'(?:crackle:|https?://(?:(?:www|m)\.)?crackle\.com/(?:playlist/\d+/|(?:[^/]+/)+))(?P<id>\d+)'
    _TEST = {
        'url': 'http://www.crackle.com/comedians-in-cars-getting-coffee/2498934',
        'info_dict': {
            'id': '2498934',
            'ext': 'mp4',
            'title': 'Everybody Respects A Bloody Nose',
            'description': 'Jerry is kaffeeklatsching in L.A. with funnyman J.B. Smoove (Saturday Night Live, Real Husbands of Hollywood). They’re headed for brew at 10 Speed Coffee in a 1964 Studebaker Avanti.',
            'thumbnail': r're:^https?://.*\.jpg',
            'duration': 906,
            'series': 'Comedians In Cars Getting Coffee',
            'season_number': 8,
            'episode_number': 4,
            # _real_extract emits one 'vtt' and one 'tt' entry per locale.
            'subtitles': {
                'en-US': [{
                    'ext': 'vtt',
                }, {
                    'ext': 'tt',
                }]
            },
        },
        'params': {
            # m3u8 download
            'skip_download': True,
        }
    }

    # (width, height) pairs for which a thumbnail URL is generated.
    _THUMBNAIL_RES = [
        (120, 90),
        (208, 156),
        (220, 124),
        (220, 220),
        (240, 180),
        (250, 141),
        (315, 236),
        (320, 180),
        (360, 203),
        (400, 300),
        (421, 316),
        (460, 330),
        (460, 460),
        (462, 260),
        (480, 270),
        (587, 330),
        (640, 480),
        (700, 330),
        (700, 394),
        (854, 480),
        (1024, 1024),
        (1920, 1080),
    ]

    # extracted from http://legacyweb-us.crackle.com/flash/ReferrerRedirect.ashx
    # Maps the file name appended to the media path to that file's dimensions.
    _MEDIA_FILE_SLOTS = {
        'c544.flv': {
            'width': 544,
            'height': 306,
        },
        '360p.mp4': {
            'width': 640,
            'height': 360,
        },
        '480p.mp4': {
            'width': 852,
            'height': 478,
        },
        '480p_1mbps.mp4': {
            'width': 852,
            'height': 478,
        },
    }

    def _real_extract(self, url):
        """Return the info dict for the Crackle video identified by *url*.

        Downloads the site configuration and the per-video XML item, then
        assembles formats, thumbnails and subtitles from them.  Thumbnails,
        HTTP formats and subtitles are only produced when the item carries a
        media path (attribute ``p``).
        """
        video_id = self._match_id(url)

        config_doc = self._download_xml(
            'http://legacyweb-us.crackle.com/flash/QueryReferrer.ashx?site=16',
            video_id, 'Downloading config')

        # NOTE(review): find('i') returns None when the response contains no
        # <i> element, in which case the attribute access below raises
        # AttributeError -- consider raising ExtractorError instead.
        item = self._download_xml(
            'http://legacyweb-us.crackle.com/app/revamp/vidwallcache.aspx?flags=-1&fm=%s' % video_id,
            video_id, headers=self.geo_verification_headers()).find('i')
        title = item.attrib['t']

        # The HLS manifest is optional: the HTTP formats below may still work.
        formats = self._extract_m3u8_formats(
            'http://content.uplynk.com/ext/%s/%s.m3u8' % (config_doc.attrib['strUplynkOwnerId'], video_id),
            video_id, 'mp4', m3u8_id='hls', fatal=False)

        thumbnails = []
        subtitles = {}
        path = item.attrib.get('p')
        if path:
            for width, height in self._THUMBNAIL_RES:
                res = '%dx%d' % (width, height)
                thumbnails.append({
                    'id': res,
                    'url': 'http://images-us-am.crackle.com/%stnl_%s.jpg' % (path, res),
                    'width': width,
                    'height': height,
                    'resolution': res,
                })

            http_base_url = 'http://ahttp.crackle.com/' + path
            for mfs_path, mfs_info in self._MEDIA_FILE_SLOTS.items():
                formats.append({
                    'url': http_base_url + mfs_path,
                    'format_id': 'http-' + mfs_path.split('.')[0],
                    'width': mfs_info['width'],
                    'height': mfs_info['height'],
                })

            for cc in item.findall('cc'):
                locale = cc.attrib.get('l')
                v = cc.attrib.get('v')
                if not (locale and v):
                    continue
                # Each caption track is offered under two URL extensions;
                # the 'xml' one is reported with ext 'tt'.
                for url_ext, ext in (('vtt', 'vtt'), ('xml', 'tt')):
                    subtitles.setdefault(locale, []).append({
                        'url': '%s/%s%s_%s.%s' % (config_doc.attrib['strSubtitleServer'], path, locale, v, url_ext),
                        'ext': ext,
                    })

        self._sort_formats(formats, ('width', 'height', 'tbr', 'format_id'))

        # 'r' is parsed as a base-16 integer and divided by 1000 (presumably
        # hexadecimal milliseconds).  True division relies on the module's
        # `from __future__ import division`.  A malformed value must not
        # abort extraction of this optional field.
        duration = None
        duration_hex = item.attrib.get('r')
        if duration_hex:
            try:
                duration = int(duration_hex, 16) / 1000
            except ValueError:
                duration = None

        return {
            'id': video_id,
            'title': title,
            'description': item.attrib.get('d'),
            'duration': duration,
            'series': item.attrib.get('sn'),
            'season_number': int_or_none(item.attrib.get('se')),
            'episode_number': int_or_none(item.attrib.get('ep')),
            'thumbnails': thumbnails,
            'subtitles': subtitles,
            'formats': formats,
        }