youtube-dl/youtube_dl/extractor/rutube.py

# coding: utf-8
from __future__ import unicode_literals

import re
import itertools

from .common import InfoExtractor
from ..compat import (
    compat_str,
    compat_parse_qs,
    compat_urllib_parse_urlparse,
)
from ..utils import (
    determine_ext,
    bool_or_none,
    int_or_none,
    try_get,
    unified_timestamp,
    url_or_none,
)


class RutubeBaseIE(InfoExtractor):
    """Common base for the Rutube extractors; holds the metadata mapping helper."""

    def _extract_video(self, video, video_id=None, require_title=True):
        """Translate a Rutube video metadata mapping into an info dict.

        :param video: mapping with the video's metadata; the keys read here
            are ``title``, ``is_adult``, ``author``, ``category``, ``id``,
            ``description``, ``thumbnail_url``, ``duration``, ``created_ts``,
            ``hits``, ``comments_count`` and ``is_livestream``.
        :param video_id: fallback used for ``id`` when the mapping carries no
            truthy ``id`` of its own.
        :param require_title: when true a missing ``title`` key raises
            ``KeyError``; when false the title may come back as ``None``.
        :return: dict of metadata fields; formats are not included.
        """
        title = video['title'] if require_title else video.get('title')

        # A missing 'is_adult' flag leaves the age limit unset (None); only an
        # explicit True maps to 18, any other present value maps to 0.
        age_limit = video.get('is_adult')
        if age_limit is not None:
            age_limit = 18 if age_limit is True else 0

        # try_get is used for the nested lookups so an absent or malformed
        # 'author' / 'category' entry does not raise here.
        uploader_id = try_get(video, lambda x: x['author']['id'])
        category = try_get(video, lambda x: x['category']['name'])

        return {
            'id': video.get('id') or video_id,
            'title': title,
            'description': video.get('description'),
            'thumbnail': video.get('thumbnail_url'),
            'duration': int_or_none(video.get('duration')),
            'uploader': try_get(video, lambda x: x['author']['name']),
            'uploader_id': compat_str(uploader_id) if uploader_id else None,
            'timestamp': unified_timestamp(video.get('created_ts')),
            # The info-dict field holding a list of categories is named
            # 'categories'; the former 'category' key is not a documented
            # field, so the extracted value never reached the metadata.
            'categories': [category] if category else None,
            'age_limit': age_limit,
            'view_count': int_or_none(video.get('hits')),
            'comment_count': int_or_none(video.get('comments_count')),
            'is_live': bool_or_none(video.get('is_livestream')),
        }


class RutubeIE(RutubeBaseIE):
    """Extractor for individual Rutube videos addressed by a 32-character id."""

    IE_NAME = 'rutube'
    IE_DESC = 'Rutube videos'
    _VALID_URL = r'https?://rutube\.ru/(?:video|(?:play/)?embed)/(?P<id>[\da-z]{32})'

    _TESTS = [
        {
            'url': 'http://rutube.ru/video/3eac3b4561676c17df9132a9a1e62e3e/',
            'md5': '79938ade01294ef7e27574890d0d3769',
            'info_dict': {
                'id': '3eac3b4561676c17df9132a9a1e62e3e',
                'ext': 'flv',
                'title': 'Раненный кенгуру забежал в аптеку',
                'description': 'http://www.ntdtv.ru ',
                'duration': 80,
                'uploader': 'NTDRussian',
                'uploader_id': '29790',
                'timestamp': 1381943602,
                'upload_date': '20131016',
                'age_limit': 0,
            },
        },
        {
            'url': 'http://rutube.ru/play/embed/a10e53b86e8f349080f718582ce4c661',
            'only_matching': True,
        },
        {
            'url': 'http://rutube.ru/embed/a10e53b86e8f349080f718582ce4c661',
            'only_matching': True,
        },
        {
            'url': 'http://rutube.ru/video/3eac3b4561676c17df9132a9a1e62e3e/?pl_id=4252',
            'only_matching': True,
        },
        {
            'url': 'https://rutube.ru/video/10b3a03fc01d5bbcc632a2f3514e8aab/?pl_type=source',
            'only_matching': True,
        },
    ]

    @classmethod
    def suitable(cls, url):
        """Reject URLs that RutubePlaylistIE accepts; otherwise defer to the base check."""
        if RutubePlaylistIE.suitable(url):
            return False
        return super(RutubeIE, cls).suitable(url)

    @staticmethod
    def _extract_urls(webpage):
        """Return the ``src`` of every Rutube embed ``<iframe>`` found in ``webpage``."""
        iframe_re = r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//rutube\.ru/embed/[\da-z]{32}.*?)\1'
        embed_urls = []
        for match in re.finditer(iframe_re, webpage):
            embed_urls.append(match.group('url'))
        return embed_urls

    def _real_extract(self, url):
        """Fetch the video metadata and play options, then assemble the info dict."""
        video_id = self._match_id(url)

        metadata_url = 'http://rutube.ru/api/video/%s/?format=json' % video_id
        metadata = self._download_json(
            metadata_url, video_id, 'Downloading video JSON')
        info = self._extract_video(metadata, video_id)

        options_url = 'http://rutube.ru/api/play/options/%s/?format=json' % video_id
        options = self._download_json(
            options_url, video_id, 'Downloading options JSON',
            headers=self.geo_verification_headers())

        formats = []
        for format_id, format_url in options['video_balancer'].items():
            # Manifest URLs are expanded by the matching helper; anything
            # else is kept as a single direct format.
            ext = determine_ext(format_url)
            if ext == 'm3u8':
                found = self._extract_m3u8_formats(
                    format_url, video_id, 'mp4',
                    m3u8_id=format_id, fatal=False)
            elif ext == 'f4m':
                found = self._extract_f4m_formats(
                    format_url, video_id,
                    f4m_id=format_id, fatal=False)
            else:
                found = [{
                    'url': format_url,
                    'format_id': format_id,
                }]
            formats.extend(found)
        self._sort_formats(formats)

        info['formats'] = formats
        return info


class RutubeEmbedIE(InfoExtractor):
    """Extractor for numeric-id Rutube embed pages; hands off to RutubeIE."""

    IE_NAME = 'rutube:embed'
    IE_DESC = 'Rutube embedded videos'
    _VALID_URL = r'https?://rutube\.ru/(?:video|play)/embed/(?P<id>[0-9]+)'

    _TESTS = [
        {
            'url': 'http://rutube.ru/video/embed/6722881?vk_puid37=&vk_puid38=',
            'info_dict': {
                'id': 'a10e53b86e8f349080f718582ce4c661',
                'ext': 'flv',
                'timestamp': 1387830582,
                'upload_date': '20131223',
                'uploader_id': '297833',
                'description': 'Видео группы ★http://vk.com/foxkidsreset★ музей Fox Kids и Jetix<br/><br/> восстановлено и сделано в шикоформате subziro89 http://vk.com/subziro89',
                'uploader': 'subziro89 ILya',
                'title': 'Мистический городок Эйри в Индиан 5 серия озвучка subziro89',
            },
            'params': {
                'skip_download': True,
            },
        },
        {
            'url': 'http://rutube.ru/play/embed/8083783',
            'only_matching': True,
        },
    ]

    def _real_extract(self, url):
        """Download the embed page and redirect to its canonical video URL."""
        embed_id = self._match_id(url)
        page = self._download_webpage(url, embed_id)

        # The embed page links to the real video page via <link rel="canonical">.
        canonical_re = r'<link\s+rel="canonical"\s+href="([^"]+?)"'
        target_url = self._html_search_regex(
            canonical_re, page, 'Canonical URL')

        return self.url_result(target_url, RutubeIE.ie_key())


class RutubePlaylistBaseIE(RutubeBaseIE):
    """Base for paginated Rutube listings; subclasses supply ``_PAGE_TEMPLATE``."""

    def _next_page_url(self, page_num, playlist_id, *args, **kwargs):
        """Format ``_PAGE_TEMPLATE`` with the playlist id and page number."""
        return self._PAGE_TEMPLATE % (playlist_id, page_num)

    def _entries(self, playlist_id, *args, **kwargs):
        """Yield one ``url``-type entry per listed video, walking the pages in order."""
        page_url = None
        for page_num in itertools.count(1):
            # Use the 'next' link from the previous page when there is one;
            # otherwise build the URL from the page number.
            if not page_url:
                page_url = self._next_page_url(
                    page_num, playlist_id, *args, **kwargs)
            page = self._download_json(
                page_url, playlist_id, 'Downloading page %s' % page_num)

            results = page.get('results')
            if not (results and isinstance(results, list)):
                break

            for item in results:
                item_url = url_or_none(item.get('video_url'))
                if item_url:
                    entry = self._extract_video(item, require_title=False)
                    entry.update(
                        _type='url',
                        url=item_url,
                        ie_key=RutubeIE.ie_key())
                    yield entry

            # Stop unless the page both names a next URL and flags 'has_next'.
            page_url = page.get('next')
            if not (page_url and page.get('has_next')):
                break

    def _extract_playlist(self, playlist_id, *args, **kwargs):
        """Wrap the lazy entries into a playlist result, titled by ``playlist_name`` if given."""
        playlist_title = kwargs.get('playlist_name')
        entries = self._entries(playlist_id, *args, **kwargs)
        return self.playlist_result(entries, playlist_id, playlist_title)

    def _real_extract(self, url):
        """Extract the playlist whose id is matched from ``url``."""
        playlist_id = self._match_id(url)
        return self._extract_playlist(playlist_id)


class RutubeChannelIE(RutubePlaylistBaseIE):
    """Playlist extractor for ``rutube.ru/tags/video/<id>`` URLs."""

    IE_NAME = 'rutube:channel'
    IE_DESC = 'Rutube channels'
    _VALID_URL = r'https?://rutube\.ru/tags/video/(?P<id>\d+)'

    # Filled with (playlist id, page number) by the inherited _next_page_url.
    _PAGE_TEMPLATE = 'http://rutube.ru/api/tags/video/%s/?page=%s&format=json'

    _TESTS = [
        {
            'url': 'http://rutube.ru/tags/video/1800/',
            'info_dict': {
                'id': '1800',
            },
            'playlist_mincount': 68,
        },
    ]


class RutubeMovieIE(RutubePlaylistBaseIE):
    """Playlist extractor for ``rutube.ru/metainfo/tv/<id>`` URLs."""

    IE_NAME = 'rutube:movie'
    IE_DESC = 'Rutube movies'
    _VALID_URL = r'https?://rutube\.ru/metainfo/tv/(?P<id>\d+)'
    _TESTS = []

    # _MOVIE_TEMPLATE takes the movie id; _PAGE_TEMPLATE takes (id, page number).
    _MOVIE_TEMPLATE = 'http://rutube.ru/api/metainfo/tv/%s/?format=json'
    _PAGE_TEMPLATE = 'http://rutube.ru/api/metainfo/tv/%s/video?page=%s&format=json'

    def _real_extract(self, url):
        """Download the movie JSON for its name, then extract the video listing."""
        movie_id = self._match_id(url)
        movie_url = self._MOVIE_TEMPLATE % movie_id
        movie = self._download_json(
            movie_url, movie_id, 'Downloading movie JSON')
        movie_name = movie.get('name')
        return self._extract_playlist(movie_id, playlist_name=movie_name)


class RutubePersonIE(RutubePlaylistBaseIE):
    """Playlist extractor for ``rutube.ru/video/person/<id>`` URLs."""

    IE_NAME = 'rutube:person'
    IE_DESC = 'Rutube person videos'
    _VALID_URL = r'https?://rutube\.ru/video/person/(?P<id>\d+)'

    # Filled with (playlist id, page number) by the inherited _next_page_url.
    _PAGE_TEMPLATE = 'http://rutube.ru/api/video/person/%s/?page=%s&format=json'

    _TESTS = [
        {
            'url': 'http://rutube.ru/video/person/313878/',
            'info_dict': {
                'id': '313878',
            },
            'playlist_mincount': 37,
        },
    ]


class RutubePlaylistIE(RutubePlaylistBaseIE):
    """Playlist extractor for video URLs carrying ``pl_id`` and ``pl_type`` query parameters."""

    IE_NAME = 'rutube:playlist'
    IE_DESC = 'Rutube playlists'
    _VALID_URL = r'https?://rutube\.ru/(?:video|(?:play/)?embed)/[\da-z]{32}/\?.*?\bpl_id=(?P<id>\d+)'

    # Filled with (playlist kind, playlist id, page number) by _next_page_url.
    _PAGE_TEMPLATE = 'http://rutube.ru/api/playlist/%s/%s/?page=%s&format=json'

    _TESTS = [
        {
            'url': 'https://rutube.ru/video/cecd58ed7d531fc0f3d795d51cee9026/?pl_id=3097&pl_type=tag',
            'info_dict': {
                'id': '3097',
            },
            'playlist_count': 27,
        },
        {
            'url': 'https://rutube.ru/video/10b3a03fc01d5bbcc632a2f3514e8aab/?pl_id=4252&pl_type=source',
            'only_matching': True,
        },
    ]

    @classmethod
    def suitable(cls, url):
        """Accept a URL only if it matches ``_VALID_URL`` and has both playlist parameters.

        Returns ``False`` when the pattern does not match; otherwise the
        result of ``pl_type and int_or_none(pl_id)``, which callers use for
        its truthiness.
        """
        if super(RutubePlaylistIE, cls).suitable(url):
            query = compat_urllib_parse_urlparse(url).query
            params = compat_parse_qs(query)
            pl_type = params.get('pl_type', [None])[0]
            return pl_type and int_or_none(params.get('pl_id', [None])[0])
        return False

    def _next_page_url(self, page_num, playlist_id, item_kind):
        """Format ``_PAGE_TEMPLATE`` with the playlist kind, id and page number."""
        template_args = (item_kind, playlist_id, page_num)
        return self._PAGE_TEMPLATE % template_args

    def _real_extract(self, url):
        """Read ``pl_type`` and ``pl_id`` from the query string and extract that playlist."""
        query = compat_parse_qs(compat_urllib_parse_urlparse(url).query)
        # 'pl_type' is looked up before 'pl_id', as in the original order.
        kind, playlist_id = query['pl_type'][0], query['pl_id'][0]
        return self._extract_playlist(playlist_id, item_kind=kind)
Unify coding cookie 2016-10-02 19:39:18 +08:00			`# coding: utf-8`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`from __future__ import unicode_literals`

Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00			`import re`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`import itertools`
Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00
			`from .common import InfoExtractor`
Fix imports and general cleanup · Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail. · Use _match_id consistently whenever possible · Fix some outdated tests · Use consistent valid URL (always match the whole protocol, no ^ at start required) · Use modern test definitions 2014-12-13 19:24:42 +08:00			`from ..compat import (`
Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00			`compat_str,`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`compat_parse_qs,`
			`compat_urllib_parse_urlparse,`
Fix imports and general cleanup · Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail. · Use _match_id consistently whenever possible · Fix some outdated tests · Use consistent valid URL (always match the whole protocol, no ^ at start required) · Use modern test definitions 2014-12-13 19:24:42 +08:00			`)`
			`from ..utils import (`
[rutube] Extract all formats 2015-11-21 20:02:52 +08:00			`determine_ext,`
[rutube] Use bool_or_none 2017-09-10 20:09:27 +08:00			`bool_or_none,`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`int_or_none,`
[rutube] Use bool_or_none 2017-09-10 20:09:27 +08:00			`try_get,`
			`unified_timestamp,`
Improve URL extraction 2018-07-21 20:08:28 +08:00			`url_or_none,`
Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00			`)`


[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`class RutubeBaseIE(InfoExtractor):`
			`def _extract_video(self, video, video_id=None, require_title=True):`
			`title = video['title'] if require_title else video.get('title')`

			`age_limit = video.get('is_adult')`
			`if age_limit is not None:`
			`age_limit = 18 if age_limit is True else 0`

			`uploader_id = try_get(video, lambda x: x['author']['id'])`
			`category = try_get(video, lambda x: x['category']['name'])`

			`return {`
			`'id': video.get('id') or video_id,`
			`'title': title,`
			`'description': video.get('description'),`
			`'thumbnail': video.get('thumbnail_url'),`
			`'duration': int_or_none(video.get('duration')),`
			`'uploader': try_get(video, lambda x: x['author']['name']),`
			`'uploader_id': compat_str(uploader_id) if uploader_id else None,`
			`'timestamp': unified_timestamp(video.get('created_ts')),`
			`'category': [category] if category else None,`
			`'age_limit': age_limit,`
			`'view_count': int_or_none(video.get('hits')),`
			`'comment_count': int_or_none(video.get('comments_count')),`
[rutube] Use bool_or_none 2017-09-10 20:09:27 +08:00			`'is_live': bool_or_none(video.get('is_livestream')),`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`}`


			`class RutubeIE(RutubeBaseIE):`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`IE_NAME = 'rutube'`
[rutube] Simplify 2014-01-28 10:32:07 +08:00			`IE_DESC = 'Rutube videos'`
[rutube] Relax _VALID_URL 2017-03-04 01:42:51 +08:00			`_VALID_URL = r'https?://rutube\.ru/(?:video|(?:play/)?embed)/(?P<id>[\da-z]{32})'`
Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00
[rutube] Extend _VALID_URL 2015-12-16 06:44:17 +08:00			`_TESTS = [{`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`'url': 'http://rutube.ru/video/3eac3b4561676c17df9132a9a1e62e3e/',`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'md5': '79938ade01294ef7e27574890d0d3769',`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`'info_dict': {`
[rutube] Modernize 2014-03-30 16:35:07 +08:00			`'id': '3eac3b4561676c17df9132a9a1e62e3e',`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'ext': 'flv',`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`'title': 'Раненный кенгуру забежал в аптеку',`
[rutube] Update test 2014-01-28 10:31:14 +08:00			`'description': 'http://www.ntdtv.ru ',`
			`'duration': 80,`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`'uploader': 'NTDRussian',`
			`'uploader_id': '29790',`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'timestamp': 1381943602,`
[rutube] Update test 2014-01-28 10:31:14 +08:00			`'upload_date': '20131016',`
[rutube] Add age_limit to test 2015-08-09 00:11:06 +08:00			`'age_limit': 0,`
Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00			`},`
[rutube] Extend _VALID_URL 2015-12-16 06:44:17 +08:00			`}, {`
			`'url': 'http://rutube.ru/play/embed/a10e53b86e8f349080f718582ce4c661',`
			`'only_matching': True,`
[rutube] Relax _VALID_URL 2017-03-04 01:42:51 +08:00			`}, {`
			`'url': 'http://rutube.ru/embed/a10e53b86e8f349080f718582ce4c661',`
			`'only_matching': True,`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`}, {`
			`'url': 'http://rutube.ru/video/3eac3b4561676c17df9132a9a1e62e3e/?pl_id=4252',`
			`'only_matching': True,`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`}, {`
			`'url': 'https://rutube.ru/video/10b3a03fc01d5bbcc632a2f3514e8aab/?pl_type=source',`
			`'only_matching': True,`
[rutube] Extend _VALID_URL 2015-12-16 06:44:17 +08:00			`}]`
Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`@classmethod`
			`def suitable(cls, url):`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`return False if RutubePlaylistIE.suitable(url) else super(RutubeIE, cls).suitable(url)`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00
[generic] Add support for rutube embeds 2017-03-04 01:46:33 +08:00			`@staticmethod`
			`def _extract_urls(webpage):`
			`return [mobj.group('url') for mobj in re.finditer(`
			`r'<iframe[^>]+?src=(["\'])(?P<url>(?:https?:)?//rutube\.ru/embed/[\da-z]{32}.*?)\1',`
			`webpage)]`

Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00			`def _real_extract(self, url):`
Fix imports and general cleanup · Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail. · Use _match_id consistently whenever possible · Fix some outdated tests · Use consistent valid URL (always match the whole protocol, no ^ at start required) · Use modern test definitions 2014-12-13 19:24:42 +08:00			`video_id = self._match_id(url)`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00
[rutube] Use _download_json 2014-03-30 17:26:35 +08:00			`video = self._download_json(`
[rutube] Modernize 2014-03-30 16:35:07 +08:00			`'http://rutube.ru/api/video/%s/?format=json' % video_id,`
			`video_id, 'Downloading video JSON')`
[rutube] Use _download_json 2014-03-30 17:26:35 +08:00
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`info = self._extract_video(video, video_id)`
[rutube] Fix extraction 2014-04-19 16:59:12 +08:00
			`options = self._download_json(`
[rutube] Add missing whitespace 2014-04-21 20:04:11 +08:00			`'http://rutube.ru/api/play/options/%s/?format=json' % video_id,`
[rutube] Use geo verification headers (closes #17897) 2018-10-17 00:19:44 +08:00			`video_id, 'Downloading options JSON',`
			`headers=self.geo_verification_headers())`
[rutube] Fix extraction 2014-04-19 16:59:12 +08:00
[rutube] Extract all formats 2015-11-21 20:02:52 +08:00			`formats = []`
			`for format_id, format_url in options['video_balancer'].items():`
			`ext = determine_ext(format_url)`
			`if ext == 'm3u8':`
Simplify formats accumulation for f4m/m3u8/smil formats Now all _extract_*_formats routines return a list 2015-12-29 02:58:24 +08:00			`formats.extend(self._extract_m3u8_formats(`
			`format_url, video_id, 'mp4', m3u8_id=format_id, fatal=False))`
[rutube] Extract all formats 2015-11-21 20:02:52 +08:00			`elif ext == 'f4m':`
Simplify formats accumulation for f4m/m3u8/smil formats Now all _extract_*_formats routines return a list 2015-12-29 02:58:24 +08:00			`formats.extend(self._extract_f4m_formats(`
			`format_url, video_id, f4m_id=format_id, fatal=False))`
[rutube] Extract all formats 2015-11-21 20:02:52 +08:00			`else:`
			`formats.append({`
			`'url': format_url,`
			`'format_id': format_id,`
			`})`
			`self._sort_formats(formats)`
Add an extractor for rutube.ru (closes #1136) It downloads with a m3u8 manifest, requires ffmpeg. 2013-10-16 22:57:40 +08:00
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`info['formats'] = formats`
			`return info`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00

[vk] Add support for rutube embeds (Fixes #4514) 2015-01-04 10:15:27 +08:00			`class RutubeEmbedIE(InfoExtractor):`
			`IE_NAME = 'rutube:embed'`
			`IE_DESC = 'Rutube embedded videos'`
Add missing r prefix for _VALID_URLs 2016-09-08 18:04:57 +08:00			`_VALID_URL = r'https?://rutube\.ru/(?:video|play)/embed/(?P<id>[0-9]+)'`
[vk] Add support for rutube embeds (Fixes #4514) 2015-01-04 10:15:27 +08:00
[rutube:embed] Extend _VALID_URL (Closes #7588) 2015-11-21 19:39:24 +08:00			`_TESTS = [{`
[vk] Add support for rutube embeds (Fixes #4514) 2015-01-04 10:15:27 +08:00			`'url': 'http://rutube.ru/video/embed/6722881?vk_puid37=&vk_puid38=',`
			`'info_dict': {`
			`'id': 'a10e53b86e8f349080f718582ce4c661',`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'ext': 'flv',`
			`'timestamp': 1387830582,`
[vk] Add support for rutube embeds (Fixes #4514) 2015-01-04 10:15:27 +08:00			`'upload_date': '20131223',`
			`'uploader_id': '297833',`
			`'description': 'Видео группы ★http://vk.com/foxkidsreset★ музей Fox Kids и Jetix<br/><br/> восстановлено и сделано в шикоформате subziro89 http://vk.com/subziro89',`
			`'uploader': 'subziro89 ILya',`
			`'title': 'Мистический городок Эйри в Индиан 5 серия озвучка subziro89',`
			`},`
			`'params': {`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'skip_download': True,`
[vk] Add support for rutube embeds (Fixes #4514) 2015-01-04 10:15:27 +08:00			`},`
[rutube:embed] Extend _VALID_URL (Closes #7588) 2015-11-21 19:39:24 +08:00			`}, {`
			`'url': 'http://rutube.ru/play/embed/8083783',`
			`'only_matching': True,`
			`}]`
[vk] Add support for rutube embeds (Fixes #4514) 2015-01-04 10:15:27 +08:00
			`def _real_extract(self, url):`
			`embed_id = self._match_id(url)`
			`webpage = self._download_webpage(url, embed_id)`

			`canonical_url = self._html_search_regex(`
			`r'<link\s+rel="canonical"\s+href="([^"]+?)"', webpage,`
			`'Canonical URL')`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`return self.url_result(canonical_url, RutubeIE.ie_key())`
[vk] Add support for rutube embeds (Fixes #4514) 2015-01-04 10:15:27 +08:00

[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`class RutubePlaylistBaseIE(RutubeBaseIE):`
			`def _next_page_url(self, page_num, playlist_id, *args, **kwargs):`
			`return self._PAGE_TEMPLATE % (playlist_id, page_num)`

			`def _entries(self, playlist_id, *args, **kwargs):`
			`next_page_url = None`
			`for pagenum in itertools.count(1):`
			`page = self._download_json(`
			`next_page_url or self._next_page_url(`
			`pagenum, playlist_id, *args, **kwargs),`
			`playlist_id, 'Downloading page %s' % pagenum)`

			`results = page.get('results')`
			`if not results or not isinstance(results, list):`
			`break`

			`for result in results:`
Improve URL extraction 2018-07-21 20:08:28 +08:00			`video_url = url_or_none(result.get('video_url'))`
			`if not video_url:`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`continue`
			`entry = self._extract_video(result, require_title=False)`
			`entry.update({`
			`'_type': 'url',`
			`'url': video_url,`
			`'ie_key': RutubeIE.ie_key(),`
			`})`
			`yield entry`

			`next_page_url = page.get('next')`
			`if not next_page_url or not page.get('has_next'):`
			`break`

			`def _extract_playlist(self, playlist_id, *args, **kwargs):`
			`return self.playlist_result(`
			`self._entries(playlist_id, *args, **kwargs),`
			`playlist_id, kwargs.get('playlist_name'))`

			`def _real_extract(self, url):`
			`return self._extract_playlist(self._match_id(url))`


			`class RutubeChannelIE(RutubePlaylistBaseIE):`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`IE_NAME = 'rutube:channel'`
[rutube] Simplify 2014-01-28 10:32:07 +08:00			`IE_DESC = 'Rutube channels'`
Add support for https for all extractors as preventive and future-proof measure 2016-03-21 23:36:32 +08:00			`_VALID_URL = r'https?://rutube\.ru/tags/video/(?P<id>\d+)'`
Move playlist tests to extractors. From now on, test_download will run these tests. That means we benefit not only from the networking setup in there, but also from the other tests (for example test_all_urls to find problems with _VALID_URLs). 2014-08-28 06:58:24 +08:00			`_TESTS = [{`
			`'url': 'http://rutube.ru/tags/video/1800/',`
			`'info_dict': {`
			`'id': '1800',`
			`},`
			`'playlist_mincount': 68,`
			`}]`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00
			`_PAGE_TEMPLATE = 'http://rutube.ru/api/tags/video/%s/?page=%s&format=json'`


[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`class RutubeMovieIE(RutubePlaylistBaseIE):`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00			`IE_NAME = 'rutube:movie'`
[rutube] Simplify 2014-01-28 10:32:07 +08:00			`IE_DESC = 'Rutube movies'`
Add support for https for all extractors as preventive and future-proof measure 2016-03-21 23:36:32 +08:00			`_VALID_URL = r'https?://rutube\.ru/metainfo/tv/(?P<id>\d+)'`
Move playlist tests to extractors. From now on, test_download will run these tests. That means we benefit not only from the networking setup in there, but also from the other tests (for example test_all_urls to find problems with _VALID_URLs). 2014-08-28 06:58:24 +08:00			`_TESTS = []`
[rutube] Add support for channels and movies 2014-01-28 07:56:09 +08:00
			`_MOVIE_TEMPLATE = 'http://rutube.ru/api/metainfo/tv/%s/?format=json'`
			`_PAGE_TEMPLATE = 'http://rutube.ru/api/metainfo/tv/%s/video?page=%s&format=json'`

			`def _real_extract(self, url):`
Fix imports and general cleanup · Import from compat what comes from compat. Yes, some names are available in utils too, but that's an implementation detail. · Use _match_id consistently whenever possible · Fix some outdated tests · Use consistent valid URL (always match the whole protocol, no ^ at start required) · Use modern test definitions 2014-12-13 19:24:42 +08:00			`movie_id = self._match_id(url)`
[rutube] Use _download_json 2014-03-30 17:26:35 +08:00			`movie = self._download_json(`
[rutube] Simplify 2014-01-28 10:32:07 +08:00			`self._MOVIE_TEMPLATE % movie_id, movie_id,`
			`'Downloading movie JSON')`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`return self._extract_playlist(`
			`movie_id, playlist_name=movie.get('name'))`
[rutube] Add support for user videos 2014-01-28 09:47:17 +08:00

[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`class RutubePersonIE(RutubePlaylistBaseIE):`
[rutube] Add support for user videos 2014-01-28 09:47:17 +08:00			`IE_NAME = 'rutube:person'`
			`IE_DESC = 'Rutube person videos'`
Add support for https for all extractors as preventive and future-proof measure 2016-03-21 23:36:32 +08:00			`_VALID_URL = r'https?://rutube\.ru/video/person/(?P<id>\d+)'`
Move playlist tests to extractors. From now on, test_download will run these tests. That means we benefit not only from the networking setup in there, but also from the other tests (for example test_all_urls to find problems with _VALID_URLs). 2014-08-28 06:58:24 +08:00			`_TESTS = [{`
			`'url': 'http://rutube.ru/video/person/313878/',`
			`'info_dict': {`
			`'id': '313878',`
			`},`
			`'playlist_mincount': 37,`
			`}]`
[rutube] Add support for user videos 2014-01-28 09:47:17 +08:00
[rutube] Simplify 2014-01-28 10:32:07 +08:00			`_PAGE_TEMPLATE = 'http://rutube.ru/api/video/person/%s/?page=%s&format=json'`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00

[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`class RutubePlaylistIE(RutubePlaylistBaseIE):`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`IE_NAME = 'rutube:playlist'`
			`IE_DESC = 'Rutube playlists'`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`_VALID_URL = r'https?://rutube\.ru/(?:video|(?:play/)?embed)/[\da-z]{32}/\?.*?\bpl_id=(?P<id>\d+)'`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`_TESTS = [{`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'url': 'https://rutube.ru/video/cecd58ed7d531fc0f3d795d51cee9026/?pl_id=3097&pl_type=tag',`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`'info_dict': {`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'id': '3097',`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`},`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`'playlist_count': 27,`
			`}, {`
			`'url': 'https://rutube.ru/video/10b3a03fc01d5bbcc632a2f3514e8aab/?pl_id=4252&pl_type=source',`
			`'only_matching': True,`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`}]`

[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`_PAGE_TEMPLATE = 'http://rutube.ru/api/playlist/%s/%s/?page=%s&format=json'`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00
[rutube:playlist] Fix suitable (closes #14166) 2017-09-11 04:22:27 +08:00			`@classmethod`
			`def suitable(cls, url):`
			`if not super(RutubePlaylistIE, cls).suitable(url):`
			`return False`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00			`params = compat_parse_qs(compat_urllib_parse_urlparse(url).query)`
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`return params.get('pl_type', [None])[0] and int_or_none(params.get('pl_id', [None])[0])`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`def _next_page_url(self, page_num, playlist_id, item_kind):`
			`return self._PAGE_TEMPLATE % (item_kind, playlist_id, page_num)`
[rutube:playlist] Add extractor (closes #13534) 2017-07-04 17:26:02 +08:00
[rutube] Rework and generalize playlist extractors (closes #13565) 2017-09-10 19:39:13 +08:00			`def _real_extract(self, url):`
			`qs = compat_parse_qs(compat_urllib_parse_urlparse(url).query)`
			`playlist_kind = qs['pl_type'][0]`
			`playlist_id = qs['pl_id'][0]`
			`return self._extract_playlist(playlist_id, item_kind=playlist_kind)`