2014-04-03 07:21:21 -07:00
# coding: utf-8
from __future__ import unicode_literals
import json
from . common import InfoExtractor
2015-09-23 05:28:05 -07:00
from . theplatform import ThePlatformIE
2014-04-03 07:21:21 -07:00
class CNETIE(InfoExtractor):
    """Information extractor for video pages under cnet.com/videos/<slug>/."""

    # The path segment after /videos/ is captured as ``id``; it is used as the
    # display id, while the real video id comes from the page's embedded JSON.
    _VALID_URL = r'https?://(?:www\.)?cnet\.com/videos/(?P<id>[^/]+)/'
    _TESTS = [{
        'url': 'http://www.cnet.com/videos/hands-on-with-microsofts-windows-8-1-update/',
        'info_dict': {
            'id': '56f4ea68-bd21-4852-b08c-4de5b8354c60',
            'ext': 'mp4',
            'title': 'Hands-on with Microsoft Windows 8.1 Update',
            'description': 'The new update to the Windows 8 OS brings improved performance for mouse and keyboard users.',
            'uploader_id': '6085384d-619e-11e3-b231-14feb5ca9861',
            'uploader': 'Sarah Mitroff',
        },
    }, {
        'url': 'http://www.cnet.com/videos/whiny-pothole-tweets-at-local-government-when-hit-by-cars-tomorrow-daily-187/',
        'info_dict': {
            'id': '56527b93-d25d-44e3-b738-f989ce2e49ba',
            'ext': 'mp4',
            'description': 'Khail and Ashley wonder what other civic woes can be solved by self-tweeting objects, investigate a new kind of VR camera and watch an origami robot self-assemble, walk, climb, dig and dissolve. #TDPothole',
            'uploader_id': 'b163284d-6b73-44fc-b3e6-3da66c392d40',
            'uploader': 'Ashley Esqueda',
            'title': 'Whiny potholes tweet at local government when hit by cars (Tomorrow Daily 187)',
        },
    }]

    def _real_extract(self, url):
        """Build the info dict for the CNET video page at ``url``.

        The page is downloaded, the JSON stored in the player div's
        ``data-cnet-video-uvp-options`` attribute is parsed, and every entry
        of the first video's ``files`` mapping is resolved through
        ThePlatformIE to collect formats and subtitles.

        Returns a dict with ``id``, ``display_id``, ``title``,
        ``description``, ``uploader``, ``uploader_id``, ``subtitles`` and
        ``formats``.

        Raises KeyError/IndexError if the embedded JSON lacks the keys read
        below (``videos``, ``id``, ``title``, ``files``, ``config`` ...).
        """
        display_id = self._match_id(url)
        webpage = self._download_webpage(url, display_id)

        # The player options are a JSON document stored in a single-quoted
        # HTML attribute of the "videoPlayer" div.
        data_json = self._html_search_regex(
            r"<div class=\"videoPlayer\"\s+.*?data-cnet-video-uvp-options='([^']+)'",
            webpage, 'data json')
        data = json.loads(data_json)
        # Only the first entry of the video list is extracted.
        vdata = data['videos'][0]

        video_id = vdata['id']
        title = vdata['title']

        author = vdata.get('author')
        if author:
            uploader = '%s %s' % (author['firstName'], author['lastName'])
            uploader_id = author.get('id')
        else:
            uploader = None
            uploader_id = None

        mpx_account = data['config']['uvpConfig']['default']['mpx_account']
        tp = ThePlatformIE(self._downloader)
        formats = []
        subtitles = {}
        # Prefer the description from the page JSON; fall back to whatever
        # ThePlatform reports for one of the files.
        description = vdata.get('description')
        files = vdata['files']
        for fkey, vid in files.items():
            # Skip the phone HLS entry when a tablet HLS entry is available
            # (presumably the tablet variant supersedes it - TODO confirm).
            if fkey == 'hls_phone' and 'hls_tablet' in files:
                continue
            result = tp.extract(
                'http://link.theplatform.com/s/%s/%s' % (mpx_account, vid))
            formats.extend(result['formats'])
            subtitles = self._merge_subtitles(subtitles, result['subtitles'])
            description = description or result.get('description')
        self._sort_formats(formats)

        return {
            'id': video_id,
            'display_id': display_id,
            'title': title,
            'description': description,
            'uploader': uploader,
            'uploader_id': uploader_id,
            'subtitles': subtitles,
            'formats': formats,
        }