youtube-dl/youtube_dl/extractor/brightcove.py

# encoding: utf-8
from __future__ import unicode_literals

import re
import json
import xml.etree.ElementTree

from .common import InfoExtractor
from ..utils import (
    compat_urllib_parse,
    find_xpath_attr,
    compat_urlparse,
    compat_str,
    compat_urllib_request,

    ExtractorError,
    unsmuggle_url,
)


class BrightcoveIE(InfoExtractor):
    """Information extractor for Brightcove viewer/player urls.

    A url carrying a video id ('@videoPlayer', 'videoId', 'videoID' or
    'bctid') is extracted as a single video; otherwise the 'playerKey'
    (or 'bckey') parameter is used to extract the player's playlist.
    """

    _VALID_URL = r'https?://.*brightcove\.com/(services|viewer).*\?(?P<query>.*)'
    _FEDERATED_URL_TEMPLATE = 'http://c.brightcove.com/services/viewer/htmlFederated?%s'
    _PLAYLIST_URL_TEMPLATE = 'http://c.brightcove.com/services/json/experience/runtime/?command=get_programming_for_experience&playerKey=%s'

    _TESTS = [
        {
            # From http://www.8tv.cat/8aldia/videos/xavier-sala-i-martin-aquesta-tarda-a-8-al-dia/
            'url': 'http://c.brightcove.com/services/viewer/htmlFederated?playerID=1654948606001&flashID=myExperience&%40videoPlayer=2371591881001',
            'file': '2371591881001.mp4',
            'md5': '5423e113865d26e40624dce2e4b45d95',
            'note': 'Test Brightcove downloads and detection in GenericIE',
            'info_dict': {
                'title': 'Xavier Sala i Martín: “Un banc que no presta és un banc zombi que no serveix per a res”',
                'uploader': '8TV',
                'description': 'md5:a950cc4285c43e44d763d036710cd9cd',
            }
        },
        {
            # From http://medianetwork.oracle.com/video/player/1785452137001
            'url': 'http://c.brightcove.com/services/viewer/htmlFederated?playerID=1217746023001&flashID=myPlayer&%40videoPlayer=1785452137001',
            'file': '1785452137001.flv',
            'info_dict': {
                'title': 'JVMLS 2012: Arrays 2.0 - Opportunities and Challenges',
                'description': 'John Rose speaks at the JVM Language Summit, August 1, 2012.',
                'uploader': 'Oracle',
            },
        },
        {
            # From http://mashable.com/2013/10/26/thermoelectric-bracelet-lets-you-control-your-body-temperature/
            'url': 'http://c.brightcove.com/services/viewer/federated_f9?&playerID=1265504713001&publisherID=AQ%7E%7E%2CAAABBzUwv1E%7E%2CxP-xFHVUstiMFlNYfvF4G9yFnNaqCw_9&videoID=2750934548001',
            'info_dict': {
                'id': '2750934548001',
                'ext': 'mp4',
                'title': 'This Bracelet Acts as a Personal Thermostat',
                'description': 'md5:547b78c64f4112766ccf4e151c20b6a0',
                'uploader': 'Mashable',
            },
        },
        {
            # test that the default referer works
            # from http://national.ballet.ca/interact/video/Lost_in_Motion_II/
            'url': 'http://link.brightcove.com/services/player/bcpid756015033001?bckey=AQ~~,AAAApYJi_Ck~,GxhXCegT1Dp39ilhXuxMJxasUhVNZiil&bctid=2878862109001',
            'info_dict': {
                'id': '2878862109001',
                'ext': 'mp4',
                'title': 'Lost in Motion II',
                'description': 'md5:363109c02998fee92ec02211bd8000df',
                'uploader': 'National Ballet of Canada',
            },
        },
    ]

    @classmethod
    def _build_brighcove_url(cls, object_str):
        """
        Build a Brightcove url from a xml string containing
        <object class="BrightcoveExperience">{params}</object>

        The 'playerID' param is required; 'playerKey', the video id
        ('@videoPlayer', 'videoId' or 'videoID') and 'linkBaseURL' are
        copied into the resulting query string only when present.

        Raises ExtractorError if the object has no 'playerID' param.
        """

        # Fix up some stupid HTML, see https://github.com/rg3/youtube-dl/issues/1553
        # (unclosed <param ...> tags are turned into self-closing ones)
        object_str = re.sub(r'(<param name="[^"]+" value="[^"]+")>',
                            r'\1/>', object_str)
        # Fix up some stupid XML, see https://github.com/rg3/youtube-dl/issues/1608
        object_str = object_str.replace('<--', '<!--')

        object_doc = xml.etree.ElementTree.fromstring(object_str)
        # Internal sanity check: we should only be handed Brightcove objects
        assert 'BrightcoveExperience' in object_doc.attrib['class']

        def find_param(name):
            """Return the value of the <param> called name, or None."""
            node = find_xpath_attr(object_doc, './param', 'name', name)
            if node is not None:
                return node.attrib['value']
            return None

        # Report a missing player id explicitly instead of failing with an
        # AttributeError on the None returned by find_xpath_attr
        player_id = find_param('playerID')
        if player_id is None:
            raise ExtractorError(
                'Cannot find the playerID parameter in the Brightcove object')
        params = {
            'playerID': player_id,
        }

        # Not all pages define this value
        player_key = find_param('playerKey')
        if player_key is not None:
            params['playerKey'] = player_key
        # The three fields hold the id of the video
        video_player = (
            find_param('@videoPlayer') or find_param('videoId') or
            find_param('videoID'))
        if video_player is not None:
            params['@videoPlayer'] = video_player
        link_base = find_param('linkBaseURL')
        if link_base is not None:
            params['linkBaseURL'] = link_base

        data = compat_urllib_parse.urlencode(params)
        return cls._FEDERATED_URL_TEMPLATE % data

    @classmethod
    def _extract_brightcove_url(cls, webpage):
        """Try to extract the brightcove url from the webpage, returns None
        if it can't be found
        """
        m_brightcove = re.search(
            r'<object[^>]+?class=([\'"])[^>]*?BrightcoveExperience.*?\1.+?</object>',
            webpage, re.DOTALL)
        if m_brightcove is None:
            return None
        return cls._build_brighcove_url(m_brightcove.group())

    def _real_extract(self, url):
        """Extract a single video or a playlist from a Brightcove url.

        Raises ExtractorError if the query string contains neither a video
        id nor a player key.
        """
        url, smuggled_data = unsmuggle_url(url, {})

        # Change the 'videoId' and others field to '@videoPlayer'
        url = re.sub(r'(?<=[?&])(videoI(d|D)|bctid)', '%40videoPlayer', url)
        # Change bckey (used by bcove.me urls) to playerKey
        url = re.sub(r'(?<=[?&])bckey', 'playerKey', url)
        mobj = re.match(self._VALID_URL, url)
        query_str = mobj.group('query')
        query = compat_urlparse.parse_qs(query_str)

        video_player = query.get('@videoPlayer')
        if video_player:
            # We set the original url as the default 'Referer' header
            referer = smuggled_data.get('Referer', url)
            return self._get_video_info(
                video_player[0], query_str, query, referer=referer)

        # No video id: fall back to the playlist of the player, failing
        # with a readable error rather than a bare KeyError
        player_key = query.get('playerKey')
        if not player_key:
            raise ExtractorError(
                'Cannot find a "@videoPlayer" or "playerKey" parameter in the url')
        return self._get_playlist_info(player_key[0])

    def _get_video_info(self, video_id, query_str, query, referer=None):
        """Download the htmlFederated page and extract the video it embeds.

        video_id is only used for reporting, query_str is appended verbatim
        to the federated url and query is its parsed form. A 'linkBaseURL'
        entry in query takes precedence over referer for the 'Referer'
        header of the request.
        """
        request_url = self._FEDERATED_URL_TEMPLATE % query_str
        req = compat_urllib_request.Request(request_url)
        link_base = query.get('linkBaseURL')
        if link_base is not None:
            referer = link_base[0]
        if referer is not None:
            req.add_header('Referer', referer)
        webpage = self._download_webpage(req, video_id)

        self.report_extraction(video_id)
        # The metadata is embedded in the page as a javascript object literal
        info = self._search_regex(r'var experienceJSON = ({.*?});', webpage, 'json')
        info = json.loads(info)['data']
        video_info = info['programmedContent']['videoPlayer']['mediaDTO']

        return self._extract_video_info(video_info)

    def _get_playlist_info(self, player_key):
        """Download the programming of a player and return it as a playlist.

        Raises ExtractorError if the response has no 'videoList' entry.
        """
        playlist_json = self._download_webpage(
            self._PLAYLIST_URL_TEMPLATE % player_key,
            player_key, 'Downloading playlist information')

        json_data = json.loads(playlist_json)
        if 'videoList' not in json_data:
            raise ExtractorError('Empty playlist')
        playlist_info = json_data['videoList']
        collection = playlist_info['mediaCollectionDTO']
        videos = [
            self._extract_video_info(video_info)
            for video_info in collection['videoDTOs']]

        return self.playlist_result(videos, playlist_id=playlist_info['id'],
                                    playlist_title=collection['displayName'])

    def _extract_video_info(self, video_info):
        """Convert a Brightcove video dictionary into an info dictionary.

        Uses the 'renditions' list for the formats when it is not empty,
        otherwise falls back to 'FLVFullLengthURL'.

        Raises ExtractorError if neither source provides a video url.
        """
        info = {
            'id': compat_str(video_info['id']),
            'title': video_info['displayName'],
            'description': video_info.get('shortDescription'),
            'thumbnail': video_info.get('videoStillURL') or video_info.get('thumbnailURL'),
            'uploader': video_info.get('publisherName'),
        }

        renditions = video_info.get('renditions')
        if renditions:
            # Formats are listed in ascending order of the rendition size
            renditions = sorted(renditions, key=lambda r: r['size'])
            info['formats'] = [{
                'url': rend['defaultURL'],
                'height': rend.get('frameHeight'),
                'width': rend.get('frameWidth'),
            } for rend in renditions]
        elif video_info.get('FLVFullLengthURL') is not None:
            # Some videos only provide a single flv version
            info.update({
                'url': video_info['FLVFullLengthURL'],
            })
        else:
            raise ExtractorError('Unable to extract video url for %s' % info['id'])
        return info
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`# encoding: utf-8`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`from __future__ import unicode_literals`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00			`import re`
			`import json`
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00			`import xml.etree.ElementTree`
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00
			`from .common import InfoExtractor`
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00			`from ..utils import (`
			`compat_urllib_parse,`
[brightcove] add import 2013-07-11 22:31:29 +08:00			`find_xpath_attr,`
BrightcoveIE: Use parse_qs to extract the fields of the query (closes #1032) Add a compat_urlparse to utils. 2013-07-12 20:53:28 +08:00			`compat_urlparse,`
[brightcove] Add the extraction of the url from generic 2013-11-06 23:40:24 +08:00			`compat_str,`
[brightcove] Set the 'Referer' header if the url has the 'linkBaseUrl' parameter (fixes #1553) 2013-11-08 04:06:48 +08:00			`compat_urllib_request,`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00
			`ExtractorError,`
Use original Referer URL in Brightcove requests (Fixes #2110) 2014-01-07 12:34:14 +08:00			`unsmuggle_url,`
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00			`)`
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00
[brightcove] Set the 'Referer' header if the url has the 'linkBaseUrl' parameter (fixes #1553) 2013-11-08 04:06:48 +08:00
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00			`class BrightcoveIE(InfoExtractor):`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00			`_VALID_URL = r'https?://.brightcove\.com/(services\|viewer).\?(?P<query>.*)'`
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00			`_FEDERATED_URL_TEMPLATE = 'http://c.brightcove.com/services/viewer/htmlFederated?%s'`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00			`_PLAYLIST_URL_TEMPLATE = 'http://c.brightcove.com/services/json/experience/runtime/?command=get_programming_for_experience&playerKey=%s'`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00
			`_TESTS = [`
			`{`
[brightcove] Use direct url for the tests The test_all_urls.py test failed because BrightcoveIE doesn't match them. 2013-09-27 00:59:56 +08:00			`# From http://www.8tv.cat/8aldia/videos/xavier-sala-i-martin-aquesta-tarda-a-8-al-dia/`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`'url': 'http://c.brightcove.com/services/viewer/htmlFederated?playerID=1654948606001&flashID=myExperience&%40videoPlayer=2371591881001',`
			`'file': '2371591881001.mp4',`
			`'md5': '5423e113865d26e40624dce2e4b45d95',`
			`'note': 'Test Brightcove downloads and detection in GenericIE',`
			`'info_dict': {`
			`'title': 'Xavier Sala i Martín: “Un banc que no presta és un banc zombi que no serveix per a res”',`
			`'uploader': '8TV',`
			`'description': 'md5:a950cc4285c43e44d763d036710cd9cd',`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`}`
			`},`
			`{`
[brightcove] Use direct url for the tests The test_all_urls.py test failed because BrightcoveIE doesn't match them. 2013-09-27 00:59:56 +08:00			`# From http://medianetwork.oracle.com/video/player/1785452137001`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`'url': 'http://c.brightcove.com/services/viewer/htmlFederated?playerID=1217746023001&flashID=myPlayer&%40videoPlayer=1785452137001',`
			`'file': '1785452137001.flv',`
			`'info_dict': {`
			`'title': 'JVMLS 2012: Arrays 2.0 - Opportunities and Challenges',`
			`'description': 'John Rose speaks at the JVM Language Summit, August 1, 2012.',`
			`'uploader': 'Oracle',`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`},`
			`},`
[brightcove] Change the 'videoId' or 'videoID' field to '@videoPlayer' (fixes #1697) It seems to be needed when using the htmlFederated page 2013-11-07 00:25:38 +08:00			`{`
			`# From http://mashable.com/2013/10/26/thermoelectric-bracelet-lets-you-control-your-body-temperature/`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`'url': 'http://c.brightcove.com/services/viewer/federated_f9?&playerID=1265504713001&publisherID=AQ%7E%7E%2CAAABBzUwv1E%7E%2CxP-xFHVUstiMFlNYfvF4G9yFnNaqCw_9&videoID=2750934548001',`
			`'info_dict': {`
			`'id': '2750934548001',`
			`'ext': 'mp4',`
			`'title': 'This Bracelet Acts as a Personal Thermostat',`
			`'description': 'md5:547b78c64f4112766ccf4e151c20b6a0',`
			`'uploader': 'Mashable',`
[brightcove] Change the 'videoId' or 'videoID' field to '@videoPlayer' (fixes #1697) It seems to be needed when using the htmlFederated page 2013-11-07 00:25:38 +08:00			`},`
			`},`
[brightcove] Use the original url (usually the player) as the default referer (fixes #1929) 2013-12-10 03:01:43 +08:00			`{`
			`# test that the default referer works`
			`# from http://national.ballet.ca/interact/video/Lost_in_Motion_II/`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`'url': 'http://link.brightcove.com/services/player/bcpid756015033001?bckey=AQ~~,AAAApYJi_Ck~,GxhXCegT1Dp39ilhXuxMJxasUhVNZiil&bctid=2878862109001',`
			`'info_dict': {`
			`'id': '2878862109001',`
			`'ext': 'mp4',`
			`'title': 'Lost in Motion II',`
			`'description': 'md5:363109c02998fee92ec02211bd8000df',`
			`'uploader': 'National Ballet of Canada',`
[brightcove] Use the original url (usually the player) as the default referer (fixes #1929) 2013-12-10 03:01:43 +08:00			`},`
			`},`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`]`
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00
			`@classmethod`
			`def _build_brighcove_url(cls, object_str):`
			`"""`
			`Build a Brightcove url from a xml string containing`
			`<object class="BrightcoveExperience">{params}</object>`
			`"""`
[brightcove] Fix up some broken HTML (#1553) 2013-10-04 17:53:49 +08:00
			`# Fix up some stupid HTML, see https://github.com/rg3/youtube-dl/issues/1553`
			`object_str = re.sub(r'(<param name="[^"]+" value="[^"]+")>',`
			`lambda m: m.group(1) + '/>', object_str)`
[brightcove] Fix more broken XML (#1608) 2013-10-17 06:46:11 +08:00			`# Fix up some stupid XML, see https://github.com/rg3/youtube-dl/issues/1608`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`object_str = object_str.replace('<--', '<!--')`
[brightcove] Fix up some broken HTML (#1553) 2013-10-04 17:53:49 +08:00
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00			`object_doc = xml.etree.ElementTree.fromstring(object_str)`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`assert 'BrightcoveExperience' in object_doc.attrib['class']`
[brightcove] The ‘id’ attribute is not always present in the object tag (fixes #2132) It looks like the ‘flashId’ parameter is not needed. 2014-01-11 02:39:42 +08:00			`params = {`
			`'playerID': find_xpath_attr(object_doc, './param', 'name', 'playerID').attrib['value'],`
			`}`
[brightcove] Set the 'videoPlayer' value to the 'videoId' if it's missing in the parameters (fixes #1815) 2013-11-24 06:26:06 +08:00			`def find_param(name):`
[brightcove] Don't use 'or' with the xml nodes, use the 'value' attribute instead 2013-11-24 18:02:34 +08:00			`node = find_xpath_attr(object_doc, './param', 'name', name)`
			`if node is not None:`
			`return node.attrib['value']`
			`return None`
[brightcove] Set the 'videoPlayer' value to the 'videoId' if it's missing in the parameters (fixes #1815) 2013-11-24 06:26:06 +08:00			`playerKey = find_param('playerKey')`
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00			`# Not all pages define this value`
			`if playerKey is not None:`
[brightcove] Don't use 'or' with the xml nodes, use the 'value' attribute instead 2013-11-24 18:02:34 +08:00			`params['playerKey'] = playerKey`
[brightcove] Set the 'videoPlayer' value to the 'videoId' if it's missing in the parameters (fixes #1815) 2013-11-24 06:26:06 +08:00			`# The three fields hold the id of the video`
			`videoPlayer = find_param('@videoPlayer') or find_param('videoId') or find_param('videoID')`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00			`if videoPlayer is not None:`
[brightcove] Don't use 'or' with the xml nodes, use the 'value' attribute instead 2013-11-24 18:02:34 +08:00			`params['@videoPlayer'] = videoPlayer`
[brightcove] Set the 'videoPlayer' value to the 'videoId' if it's missing in the parameters (fixes #1815) 2013-11-24 06:26:06 +08:00			`linkBase = find_param('linkBaseURL')`
[brightcove] Set the 'Referer' header if the url has the 'linkBaseUrl' parameter (fixes #1553) 2013-11-08 04:06:48 +08:00			`if linkBase is not None:`
[brightcove] Don't use 'or' with the xml nodes, use the 'value' attribute instead 2013-11-24 18:02:34 +08:00			`params['linkBaseURL'] = linkBase`
GenericIE: Detect videos from Brightcove Brightcove videos info is usually found in an <object class="BrightcoveExperience"></object> node, this is passed to a new method of BrightcoveIE that builds a url to extract the video. 2013-07-10 23:49:11 +08:00			`data = compat_urllib_parse.urlencode(params)`
			`return cls._FEDERATED_URL_TEMPLATE % data`
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00
[brightcove] Add the extraction of the url from generic 2013-11-06 23:40:24 +08:00			`@classmethod`
			`def _extract_brightcove_url(cls, webpage):`
			`"""Try to extract the brightcove url from the wepbage, returns None`
			`if it can't be found`
			`"""`
			`m_brightcove = re.search(`
			`r'<object[^>]+?class=([\'"])[^>]?BrightcoveExperience.?\1.+?</object>',`
			`webpage, re.DOTALL)`
			`if m_brightcove is not None:`
			`return cls._build_brighcove_url(m_brightcove.group())`
			`else:`
			`return None`

Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00			`def _real_extract(self, url):`
Use original Referer URL in Brightcove requests (Fixes #2110) 2014-01-07 12:34:14 +08:00			`url, smuggled_data = unsmuggle_url(url, {})`

[brightcove] Support redirected urls from bcove.me (fixes #1732) 'bctid' needs to be changed to '@videoPlayer', and 'bckey' to 'playerKey'. 2013-11-07 05:03:00 +08:00			`# Change the 'videoId' and others field to '@videoPlayer'`
			`url = re.sub(r'(?<=[?&])(videoI(d\|D)\|bctid)', '%40videoPlayer', url)`
			`# Change bckey (used by bcove.me urls) to playerKey`
			`url = re.sub(r'(?<=[?&])bckey', 'playerKey', url)`
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00			`mobj = re.match(self._VALID_URL, url)`
BrightcoveIE: Use parse_qs to extract the fields of the query (closes #1032) Add a compat_urlparse to utils. 2013-07-12 20:53:28 +08:00			`query_str = mobj.group('query')`
			`query = compat_urlparse.parse_qs(query_str)`
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00
BrightcoveIE: Use parse_qs to extract the fields of the query (closes #1032) Add a compat_urlparse to utils. 2013-07-12 20:53:28 +08:00			`videoPlayer = query.get('@videoPlayer')`
			`if videoPlayer:`
Use original Referer URL in Brightcove requests (Fixes #2110) 2014-01-07 12:34:14 +08:00			`# We set the original url as the default 'Referer' header`
			`referer = smuggled_data.get('Referer', url)`
			`return self._get_video_info(`
			`videoPlayer[0], query_str, query, referer=referer)`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00			`else:`
BrightcoveIE: Use parse_qs to extract the fields of the query (closes #1032) Add a compat_urlparse to utils. 2013-07-12 20:53:28 +08:00			`player_key = query['playerKey']`
			`return self._get_playlist_info(player_key[0])`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00
[brightcove] Use the original url (usually the player) as the default referer (fixes #1929) 2013-12-10 03:01:43 +08:00			`def _get_video_info(self, video_id, query_str, query, referer=None):`
[brightcove] Set the 'Referer' header if the url has the 'linkBaseUrl' parameter (fixes #1553) 2013-11-08 04:06:48 +08:00			`request_url = self._FEDERATED_URL_TEMPLATE % query_str`
			`req = compat_urllib_request.Request(request_url)`
			`linkBase = query.get('linkBaseURL')`
			`if linkBase is not None:`
[brightcove] Use the original url (usually the player) as the default referer (fixes #1929) 2013-12-10 03:01:43 +08:00			`referer = linkBase[0]`
			`if referer is not None:`
			`req.add_header('Referer', referer)`
[brightcove] Set the 'Referer' header if the url has the 'linkBaseUrl' parameter (fixes #1553) 2013-11-08 04:06:48 +08:00			`webpage = self._download_webpage(req, video_id)`
Add BrightcoveIE (closes #832) It only accepts the urls that are use for embedding the video, it doesn't search in generic webpages to find Brightcove videos 2013-07-06 03:31:50 +08:00
			`self.report_extraction(video_id)`
			`info = self._search_regex(r'var experienceJSON = ({.*?});', webpage, 'json')`
			`info = json.loads(info)['data']`
			`video_info = info['programmedContent']['videoPlayer']['mediaDTO']`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00
			`return self._extract_video_info(video_info)`

			`def _get_playlist_info(self, player_key):`
			`playlist_info = self._download_webpage(self._PLAYLIST_URL_TEMPLATE % player_key,`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`player_key, 'Downloading playlist information')`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00
[brightcove] Raise error if playlist is empty (#1608) 2013-10-17 07:02:17 +08:00			`json_data = json.loads(playlist_info)`
			`if 'videoList' not in json_data:`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`raise ExtractorError('Empty playlist')`
[brightcove] Raise error if playlist is empty (#1608) 2013-10-17 07:02:17 +08:00			`playlist_info = json_data['videoList']`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00			`videos = [self._extract_video_info(video_info) for video_info in playlist_info['mediaCollectionDTO']['videoDTOs']]`

			`return self.playlist_result(videos, playlist_id=playlist_info['id'],`
			`playlist_title=playlist_info['mediaCollectionDTO']['displayName'])`

			`def _extract_video_info(self, video_info):`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`info = {`
[brightcove] Add the extraction of the url from generic 2013-11-06 23:40:24 +08:00			`'id': compat_str(video_info['id']),`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`'title': video_info['displayName'],`
			`'description': video_info.get('shortDescription'),`
			`'thumbnail': video_info.get('videoStillURL') or video_info.get('thumbnailURL'),`
			`'uploader': video_info.get('publisherName'),`
			`}`
BrightcoveIE: add support for playlists 2013-07-11 06:04:33 +08:00
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`renditions = video_info.get('renditions')`
			`if renditions:`
			`renditions = sorted(renditions, key=lambda r: r['size'])`
[brightcove] Extract all the available formats 2013-11-07 02:05:41 +08:00			`info['formats'] = [{`
			`'url': rend['defaultURL'],`
			`'height': rend.get('frameHeight'),`
			`'width': rend.get('frameWidth'),`
			`} for rend in renditions]`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`elif video_info.get('FLVFullLengthURL') is not None:`
			`info.update({`
			`'url': video_info['FLVFullLengthURL'],`
			`})`
			`else:`
[brightcove] Use unicode_literals 2014-01-07 12:23:20 +08:00			`raise ExtractorError('Unable to extract video url for %s' % info['id'])`
[brightcove] Support videos that only provide flv versions (fixes #1504) Moved the test from generic.py to brightcove.py 2013-09-26 19:53:57 +08:00			`return info`