1
0
mirror of https://github.com/l1ving/youtube-dl synced 2025-01-21 11:52:52 +08:00

[europawebcast] Add extractor

This commit is contained in:
0x9fff00 2020-06-10 22:05:52 +02:00
parent e1723c4bac
commit d19a2e6abe
No known key found for this signature in database
GPG Key ID: 86AD72D07B1EC224
2 changed files with 77 additions and 0 deletions

View File

@ -0,0 +1,76 @@
# coding: utf-8
from __future__ import unicode_literals
from .common import InfoExtractor
class EuropaWebcastIE(InfoExtractor):
_VALID_URL = r'https?://webcast.ec.europa.eu/(?P<id>[^/?#&]+)'
_TEST = {
'url': 'https://webcast.ec.europa.eu/copyright-stakeholder-dialogues',
'md5': 'cb2873afec20f44a6521eb99b90864ec',
'info_dict': {
'id': 'copyright-stakeholder-dialogues',
'ext': 'mp4',
'title': 'COPYRIGHT STAKEHOLDER DIALOGUES',
'timestamp': 1571126116,
'upload_date': '20191015',
'duration': 21600,
},
}
def _real_extract(self, url):
video_id = self._match_id(url)
webpage = self._download_webpage(url, video_id)
session_data = self._parse_json(
self._search_regex(r'var\s+sessionData\s*=\s*({.+});', webpage,
'session data', fatal=False), video_id)
media_setup = self._parse_json(
self._search_regex(r'var\s+mediaSetup\s*=\s*({.+});', webpage,
'media setup'), video_id)
playlist_item = media_setup['playlist'][0]
title = session_data.get('name') or self._html_search_regex(
r'<span[^>]+class="[^"]*(?:pageSectionTitle|sessionTitle)[^>]+>([^<]+)</span>',
webpage, 'title')
start_time = playlist_item.get('startUTC')
stop_time = playlist_item.get('stopUTC')
if start_time and stop_time:
duration = stop_time - start_time
else:
duration = None
source_data = playlist_item['source']
base_url = 'https://%s/%s/' % (
media_setup['server'], media_setup['application'])
formats = []
for lang in source_data['languages']:
lang_formats = []
for quality in source_data['qualities']:
lang_formats.extend(self._extract_m3u8_formats(
'%s%s/playlist.m3u8?tracks=%s' % (
base_url, source_data['qualities'][quality], lang), video_id,
ext='mp4', entry_protocol='m3u8_native',
m3u8_id='%s-%s' % (quality, lang)))
if lang == 'or':
for fmt in lang_formats:
fmt['preference'] = 1 # prefer original language
else:
for fmt in lang_formats:
fmt['language'] = lang
formats.extend(lang_formats)
self._sort_formats(formats)
return {
'id': video_id,
'title': title,
'formats': formats,
'timestamp': start_time,
'duration': duration,
}

View File

@ -327,6 +327,7 @@ from .espn import (
) )
from .esri import EsriVideoIE from .esri import EsriVideoIE
from .europa import EuropaIE from .europa import EuropaIE
from .europawebcast import EuropaWebcastIE
from .everyonesmixtape import EveryonesMixtapeIE from .everyonesmixtape import EveryonesMixtapeIE
from .expotv import ExpoTVIE from .expotv import ExpoTVIE
from .expressen import ExpressenIE from .expressen import ExpressenIE