2014-08-23 06:20:49 -07:00
# -*- coding: utf-8 -*-
from __future__ import unicode_literals
import json
import re
from . common import InfoExtractor
from . . utils import (
js_to_json ,
remove_end ,
)
class SBSIE ( InfoExtractor ) :
IE_DESC = ' sbs.com.au '
_VALID_URL = r ' https?://(?:www \ .)?sbs \ .com \ .au/ondemand/video/single/(?P<id>[0-9]+)/ '
_TESTS = [ {
# Original URL is handled by the generic IE which finds the iframe:
# http://www.sbs.com.au/thefeed/blog/2014/08/21/dingo-conservation
' url ' : ' http://www.sbs.com.au/ondemand/video/single/320403011771/?source=drupal&vertical=thefeed ' ,
' md5 ' : ' 3150cf278965eeabb5b4cea1c963fe0a ' ,
' info_dict ' : {
' id ' : ' 320403011771 ' ,
2014-09-21 07:08:38 -07:00
' ext ' : ' mp4 ' ,
2014-08-23 06:20:49 -07:00
' title ' : ' Dingo Conservation ' ,
' description ' : ' Dingoes are on the brink of extinction; most of the animals we think are dingoes are in fact crossbred with wild dogs. This family run a dingo conservation park to prevent their extinction ' ,
' thumbnail ' : ' re:http://.* \ .jpg ' ,
} ,
' add_ies ' : [ ' generic ' ] ,
} ]
def _real_extract ( self , url ) :
mobj = re . match ( self . _VALID_URL , url )
video_id = mobj . group ( ' id ' )
webpage = self . _download_webpage ( url , video_id )
release_urls_json = js_to_json ( self . _search_regex (
r ' (?s)playerParams \ .releaseUrls \ s*= \ s*( \ { .*? \ n \ }); \ n ' ,
webpage , ' ' ) )
release_urls = json . loads ( release_urls_json )
theplatform_url = (
release_urls . get ( ' progressive ' ) or release_urls . get ( ' standard ' ) )
title = remove_end ( self . _og_search_title ( webpage ) , ' (The Feed) ' )
description = self . _html_search_meta ( ' description ' , webpage )
thumbnail = self . _og_search_thumbnail ( webpage )
return {
' _type ' : ' url_transparent ' ,
' id ' : video_id ,
' url ' : theplatform_url ,
' title ' : title ,
' description ' : description ,
' thumbnail ' : thumbnail ,
}