youtube-dl/youtube_dl/extractor/spankbang.py

# coding: utf-8
from __future__ import unicode_literals

from .common import InfoExtractor
import re

class SpankBangIE(InfoExtractor):
    """Extractor for http://spankbang.com"""
    
    _VALID_URL = r"https?://(?:www\.)?spankbang\.com/(?P<id>\w+)/video/.*"
    
    _TEST = {
        "url": "http://spankbang.com/3vvn/video/fantasy+solo",
        "md5": "1cc433e1d6aa14bc376535b8679302f7",
        "info_dict": {
            "id": "3vvn",
            "title": "fantasy solo",
            "description": "Watch fantasy solo free HD porn video - 05 minutes - dillion harper masturbates on a bed free adult movies.",
            "format": "720p",
            "format_id": "720p",
            "ext": "mp4",
            "url": "re:http://spankbang.com/_3vvn/IjE0MjgyNjY5MTcuMzUi.IaGrcF-vDrvktMhjd-1fWixiCzU/title/720p__mp4"
        }
    }

    def _real_extract(self, url):
        video_id = self._match_id(url)
        webpage = self._download_webpage(url, video_id)

        title = self._html_search_regex(r"<h1>(?:<img.+?>)?(.*?)</h1>", webpage, "title")
        
        stream_key = self._html_search_regex(r"""var\s+stream_key\s*[=]\s*['"](.+?)['"]\s*;""", webpage, "stream_key")
        
        qualities = re.findall(r"<span.+?>([0-9]+p).*?</span>", webpage)
        
        formats = []
        for q in sorted(qualities):
            formats.append({
                "format_id": q,
                "format": q,
                "ext": "mp4",
                "url": "http://spankbang.com/_{0}/{1}/title/{2}__mp4".format(video_id, stream_key, q)
            })

        return {
            "id": video_id,
            "title": title,
            "description": self._og_search_description(webpage),
            "formats": formats
        }

# vim: tabstop=4 expandtab
[SpankBang] Add new extractor 2015-04-05 12:50:21 -07:00			`# coding: utf-8`
			`from __future__ import unicode_literals`

			`from .common import InfoExtractor`
			`import re`

			`class SpankBangIE(InfoExtractor):`
			`"""Extractor for http://spankbang.com"""`

			`_VALID_URL = r"https?://(?:www\.)?spankbang\.com/(?P<id>\w+)/video/.*"`
[SpankBang] Add test 2015-04-05 13:57:59 -07:00
			`_TEST = {`
			`"url": "http://spankbang.com/3vvn/video/fantasy+solo",`
			`"md5": "1cc433e1d6aa14bc376535b8679302f7",`
			`"info_dict": {`
			`"id": "3vvn",`
			`"title": "fantasy solo",`
			`"description": "Watch fantasy solo free HD porn video - 05 minutes - dillion harper masturbates on a bed free adult movies.",`
			`"format": "720p",`
			`"format_id": "720p",`
			`"ext": "mp4",`
			`"url": "re:http://spankbang.com/_3vvn/IjE0MjgyNjY5MTcuMzUi.IaGrcF-vDrvktMhjd-1fWixiCzU/title/720p__mp4"`
			`}`
			`}`
[SpankBang] Add new extractor 2015-04-05 12:50:21 -07:00
			`def _real_extract(self, url):`
			`video_id = self._match_id(url)`
			`webpage = self._download_webpage(url, video_id)`

			`title = self._html_search_regex(r"<h1>(?:<img.+?>)?(.*?)</h1>", webpage, "title")`

			`stream_key = self._html_search_regex(r"""var\s+stream_key\s[=]\s['"](.+?)['"]\s*;""", webpage, "stream_key")`

			`qualities = re.findall(r"<span.+?>([0-9]+p).*?</span>", webpage)`

			`formats = []`
			`for q in sorted(qualities):`
			`formats.append({`
			`"format_id": q,`
			`"format": q,`
			`"ext": "mp4",`
[SpankBang] Use python2.6 compatible string formatting spec 2015-04-05 13:43:21 -07:00			`"url": "http://spankbang.com/_{0}/{1}/title/{2}__mp4".format(video_id, stream_key, q)`
[SpankBang] Add new extractor 2015-04-05 12:50:21 -07:00			`})`

			`return {`
			`"id": video_id,`
			`"title": title,`
			`"description": self._og_search_description(webpage),`
			`"formats": formats`
			`}`

			`# vim: tabstop=4 expandtab`